{ "metadata": { "total_size": 70801904048 }, "weight_map": { "layers.0.attention.kv_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.q_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.wkv_b.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.wo.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.wq_a.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention.wq_b.weight": "consolidated-00001-of-00013.safetensors", "layers.0.attention_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.0.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.1.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.10.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.100.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.101.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.102.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.103.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.104.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.105.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.106.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.107.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.108.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.109.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.11.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.110.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.111.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.112.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.113.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.114.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.115.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.116.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.117.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.118.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.119.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.12.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.120.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.121.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.122.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.123.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.124.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.125.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.126.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.127.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.13.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.14.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.15.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.16.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.17.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.18.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.19.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.2.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.20.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.21.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.22.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.23.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.24.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.25.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.26.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.27.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.28.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.29.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.3.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.30.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.31.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.32.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.33.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.34.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.35.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.36.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.37.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.38.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.39.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.4.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.40.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.41.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.42.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.43.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.44.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.45.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.46.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.47.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.48.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.49.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.5.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.50.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.51.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.52.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.53.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.54.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.55.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.56.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.57.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.58.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.59.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.6.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.60.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.61.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.62.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.63.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.64.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.65.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.66.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.67.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.68.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.69.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.7.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.70.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.71.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.72.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.73.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.74.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.75.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.76.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.77.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.78.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.79.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.8.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.80.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.81.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.82.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.83.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.84.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.85.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.86.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.87.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.88.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.89.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.9.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.90.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.91.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.92.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.93.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.94.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.95.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.96.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.97.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.98.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.experts.99.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.ffn_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.0.gate.weight": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.0.shared_experts.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.attention.kv_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.q_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.wkv_b.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.wo.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.wq_a.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention.wq_b.weight": "consolidated-00001-of-00013.safetensors", "layers.1.attention_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.0.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.1.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.10.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.100.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.101.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.102.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.103.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.104.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.105.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.106.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.107.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.108.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.109.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.11.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.110.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.111.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.112.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.113.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.114.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.115.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.116.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.117.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.118.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.119.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.12.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.120.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.121.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.122.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.123.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.124.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.125.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.126.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.127.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.13.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.14.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.15.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.16.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.17.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.18.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.19.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.2.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.20.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.21.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.22.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.23.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.24.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.25.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.26.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.27.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.28.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.29.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.3.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.30.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.31.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.32.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.33.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.34.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.35.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.36.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.37.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.38.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.39.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.4.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.40.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.41.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.42.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.43.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.44.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.45.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.46.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.47.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.48.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.49.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.5.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.50.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.51.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.52.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.53.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.54.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.55.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.56.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.57.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.58.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.59.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.6.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.60.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.61.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.62.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.63.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.64.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.65.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.66.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.67.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.68.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.69.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.7.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.70.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.71.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.72.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.73.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.74.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.75.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.76.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.77.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.78.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.79.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.8.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.80.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.81.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.82.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.83.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.84.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.85.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.86.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.87.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.88.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.89.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.9.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.90.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.91.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.92.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.93.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.94.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.95.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.96.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.97.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.98.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.experts.99.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.ffn_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.1.gate.weight": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.1.shared_experts.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.attention.kv_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.q_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.wkv_b.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.wo.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.wq_a.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention.wq_b.weight": "consolidated-00001-of-00013.safetensors", "layers.10.attention_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.0.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.1.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.10.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.100.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.101.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.102.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.103.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.104.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.105.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.106.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.107.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.108.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.109.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.11.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.110.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.111.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.112.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.113.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.114.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.115.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.116.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.117.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.118.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.119.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.12.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.120.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.121.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.122.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.123.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.124.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.125.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.126.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.127.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.13.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.14.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.15.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.16.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.17.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.18.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.19.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.2.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.20.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.21.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.22.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.23.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.24.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.25.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.26.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.27.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.28.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.29.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.3.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.30.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.31.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.32.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.33.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.34.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.35.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.36.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.37.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.38.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.39.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.4.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.40.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.41.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.42.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.43.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.44.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.45.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.46.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.47.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.48.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.49.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.5.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.50.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.51.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.52.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.53.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.54.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.55.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.56.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.57.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.58.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.59.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.6.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.60.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.61.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.62.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.63.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.64.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.65.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.66.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.67.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.68.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.69.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.7.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.70.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.71.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.72.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.73.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.74.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.75.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.76.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.77.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.78.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.79.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.8.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.80.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.81.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.82.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.83.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.84.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.85.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.86.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.87.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.88.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.89.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.9.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.90.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.91.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.92.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.93.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.94.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.95.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.96.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.97.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.98.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.experts.99.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.ffn_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.10.gate.weight": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.10.shared_experts.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.attention.kv_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.q_a_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.wkv_b.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.wo.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.wq_a.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention.wq_b.weight": "consolidated-00001-of-00013.safetensors", "layers.11.attention_norm.weight": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.0.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.1.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.10.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.100.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w1.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w1.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w1.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w3.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w3.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.101.w3.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.102.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.102.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.102.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.102.w2.weight_global_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.102.w2.weight_packed": "consolidated-00001-of-00013.safetensors", "layers.11.experts.102.w2.weight_scale": "consolidated-00001-of-00013.safetensors", "layers.11.experts.102.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.102.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.102.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.103.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.104.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.105.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.106.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.107.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.108.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.109.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.11.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.110.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.111.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.112.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.113.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.114.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.115.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.116.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.117.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.118.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.119.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.12.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.120.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.121.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.122.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.123.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.124.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.125.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.126.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.127.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.13.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.14.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.15.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.16.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.17.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.18.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.19.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.2.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.20.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.21.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.22.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.23.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.24.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.25.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.26.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.27.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.28.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.29.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.3.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.30.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.31.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.32.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.33.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.34.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.35.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.36.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.37.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.38.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.39.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.4.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.40.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.41.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.42.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.43.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.44.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.45.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.46.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.47.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.48.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.49.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.5.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.50.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.51.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.52.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.53.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.54.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.55.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.56.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.57.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.58.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.59.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.6.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.60.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.61.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.62.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.63.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.64.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.65.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.66.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.67.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.68.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.69.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.7.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.70.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.71.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.72.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.73.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.74.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.75.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.76.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.77.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.78.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.79.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.8.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.80.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.81.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.82.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.83.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.84.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.85.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.86.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.87.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.88.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.89.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.9.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.90.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.91.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.92.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.93.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.94.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.95.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.96.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.97.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.98.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.experts.99.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.ffn_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.11.gate.weight": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.11.shared_experts.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.attention.kv_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.q_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.wkv_a_with_mqa.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.wkv_b.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.wo.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.wq_a.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention.wq_b.weight": "consolidated-00002-of-00013.safetensors", "layers.12.attention_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.0.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.1.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.10.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.100.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.101.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.102.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.103.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.104.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.105.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.106.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.107.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.108.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.109.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.11.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.110.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.111.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.112.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.113.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.114.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.115.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.116.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.117.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.118.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.119.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.12.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.120.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.121.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.122.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.123.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.124.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.125.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.126.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.127.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.13.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.14.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.15.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.16.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.17.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.18.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.19.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.2.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.20.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.21.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.22.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.23.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.24.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.25.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.26.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.27.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.28.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.29.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.3.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.30.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.31.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.32.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.33.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.34.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.35.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.36.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.37.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.38.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.39.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.4.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.40.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.41.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.42.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.43.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.44.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.45.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.46.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.47.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.48.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.49.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.5.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.50.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.51.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.52.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.53.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.54.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.55.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.56.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.57.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.58.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.59.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.6.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.60.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.61.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.62.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.63.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.64.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.65.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.66.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.67.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.68.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.69.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.7.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.70.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.71.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.72.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.73.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.74.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.75.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.76.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.77.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.78.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.79.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.8.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.80.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.81.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.82.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.83.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.84.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.85.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.86.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.87.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.88.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.89.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.9.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.90.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.91.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.92.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.93.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.94.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.95.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.96.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.97.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.98.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.experts.99.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.ffn_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.12.gate.weight": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.12.shared_experts.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.attention.kv_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.q_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.wkv_a_with_mqa.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.wkv_b.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.wo.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.wq_a.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention.wq_b.weight": "consolidated-00002-of-00013.safetensors", "layers.13.attention_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.0.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.1.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.10.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.100.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.101.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.102.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.103.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.104.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.105.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.106.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.107.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.108.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.109.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.11.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.110.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.111.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.112.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.113.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.114.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.115.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.116.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.117.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.118.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.119.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.12.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.120.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.121.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.122.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.123.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.124.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.125.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.126.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.127.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.13.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.14.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.15.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.16.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.17.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.18.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.19.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.2.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.20.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.21.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.22.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.23.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.24.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.25.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.26.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.27.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.28.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.29.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.3.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.30.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.31.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.32.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.33.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.34.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.35.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.36.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.37.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.38.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.39.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.4.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.40.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.41.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.42.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.43.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.44.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.45.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.46.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.47.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.48.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.49.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.5.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.50.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.51.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.52.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.53.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.54.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.55.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.56.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.57.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.58.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.59.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.6.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.60.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.61.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.62.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.63.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.64.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.65.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.66.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.67.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.68.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.69.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.7.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.70.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.71.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.72.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.73.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.74.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.75.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.76.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.77.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.78.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.79.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.8.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.80.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.81.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.82.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.83.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.84.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.85.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.86.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.87.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.88.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.89.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.9.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.90.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.91.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.92.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.93.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.94.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.95.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.96.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.97.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.98.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.experts.99.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.ffn_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.13.gate.weight": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.13.shared_experts.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.attention.kv_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.q_a_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.wkv_a_with_mqa.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.wkv_b.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.wo.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.wq_a.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention.wq_b.weight": "consolidated-00002-of-00013.safetensors", "layers.14.attention_norm.weight": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.0.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.1.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.10.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.100.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.101.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.102.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.103.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.104.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.105.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.106.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.107.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w1.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w1.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w1.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w2.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w2.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w2.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w3.weight_global_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w3.weight_packed": "consolidated-00002-of-00013.safetensors", "layers.14.experts.108.w3.weight_scale": "consolidated-00002-of-00013.safetensors", "layers.14.experts.109.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.109.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.11.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.110.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.111.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.112.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.113.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.114.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.115.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.116.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.117.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.118.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.119.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.12.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.120.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.121.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.122.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.123.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.124.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.125.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.126.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.127.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.13.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.14.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.15.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.16.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.17.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.18.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.19.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.2.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.20.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.21.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.22.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.23.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.24.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.25.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.26.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.27.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.28.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.29.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.3.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.30.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.31.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.32.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.33.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.34.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.35.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.36.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.37.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.38.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.39.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.4.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.40.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.41.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.42.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.43.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.44.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.45.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.46.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.47.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.48.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.49.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.5.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.50.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.51.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.52.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.53.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.54.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.55.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.56.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.57.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.58.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.59.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.6.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.60.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.61.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.62.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.63.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.64.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.65.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.66.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.67.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.68.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.69.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.7.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.70.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.71.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.72.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.73.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.74.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.75.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.76.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.77.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.78.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.79.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.8.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.80.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.81.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.82.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.83.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.84.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.85.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.86.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.87.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.88.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.89.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.9.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.90.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.91.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.92.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.93.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.94.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.95.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.96.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.97.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.98.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.experts.99.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.ffn_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.14.gate.weight": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.14.shared_experts.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.attention.kv_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.q_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.wkv_a_with_mqa.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.wkv_b.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.wo.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.wq_a.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention.wq_b.weight": "consolidated-00003-of-00013.safetensors", "layers.15.attention_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.0.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.1.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.10.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.100.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.101.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.102.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.103.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.104.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.105.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.106.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.107.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.108.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.109.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.11.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.110.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.111.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.112.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.113.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.114.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.115.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.116.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.117.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.118.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.119.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.12.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.120.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.121.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.122.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.123.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.124.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.125.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.126.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.127.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.13.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.14.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.15.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.16.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.17.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.18.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.19.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.2.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.20.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.21.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.22.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.23.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.24.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.25.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.26.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.27.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.28.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.29.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.3.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.30.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.31.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.32.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.33.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.34.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.35.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.36.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.37.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.38.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.39.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.4.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.40.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.41.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.42.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.43.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.44.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.45.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.46.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.47.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.48.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.49.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.5.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.50.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.51.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.52.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.53.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.54.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.55.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.56.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.57.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.58.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.59.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.6.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.60.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.61.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.62.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.63.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.64.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.65.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.66.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.67.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.68.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.69.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.7.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.70.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.71.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.72.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.73.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.74.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.75.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.76.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.77.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.78.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.79.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.8.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.80.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.81.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.82.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.83.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.84.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.85.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.86.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.87.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.88.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.89.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.9.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.90.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.91.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.92.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.93.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.94.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.95.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.96.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.97.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.98.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.experts.99.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.ffn_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.15.gate.weight": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.15.shared_experts.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.attention.kv_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.q_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.wkv_a_with_mqa.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.wkv_b.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.wo.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.wq_a.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention.wq_b.weight": "consolidated-00003-of-00013.safetensors", "layers.16.attention_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.0.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.1.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.10.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.100.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.101.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.102.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.103.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.104.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.105.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.106.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.107.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.108.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.109.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.11.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.110.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.111.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.112.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.113.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.114.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.115.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.116.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.117.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.118.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.119.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.12.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.120.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.121.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.122.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.123.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.124.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.125.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.126.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.127.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.13.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.14.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.15.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.16.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.17.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.18.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.19.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.2.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.20.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.21.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.22.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.23.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.24.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.25.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.26.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.27.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.28.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.29.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.3.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.30.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.31.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.32.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.33.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.34.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.35.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.36.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.37.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.38.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.39.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.4.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.40.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.41.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.42.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.43.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.44.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.45.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.46.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.47.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.48.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.49.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.5.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.50.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.51.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.52.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.53.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.54.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.55.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.56.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.57.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.58.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.59.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.6.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.60.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.61.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.62.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.63.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.64.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.65.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.66.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.67.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.68.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.69.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.7.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.70.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.71.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.72.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.73.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.74.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.75.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.76.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.77.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.78.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.79.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.8.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.80.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.81.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.82.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.83.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.84.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.85.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.86.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.87.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.88.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.89.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.9.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.90.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.91.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.92.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.93.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.94.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.95.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.96.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.97.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.98.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.experts.99.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.ffn_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.16.gate.weight": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.16.shared_experts.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.attention.kv_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.q_a_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.wkv_a_with_mqa.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.wkv_b.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.wo.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.wq_a.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention.wq_b.weight": "consolidated-00003-of-00013.safetensors", "layers.17.attention_norm.weight": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.0.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.1.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.10.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.100.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.101.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.102.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.103.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.104.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.105.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.106.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.107.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.108.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.109.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.11.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.110.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.111.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.112.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.113.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w1.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w1.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w1.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w2.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w2.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w2.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w3.weight_global_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w3.weight_packed": "consolidated-00003-of-00013.safetensors", "layers.17.experts.114.w3.weight_scale": "consolidated-00003-of-00013.safetensors", "layers.17.experts.115.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.115.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.116.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.117.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.118.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.119.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.12.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.120.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.121.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.122.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.123.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.124.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.125.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.126.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.127.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.13.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.14.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.15.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.16.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.17.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.18.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.19.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.2.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.20.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.21.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.22.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.23.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.24.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.25.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.26.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.27.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.28.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.29.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.3.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.30.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.31.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.32.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.33.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.34.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.35.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.36.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.37.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.38.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.39.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.4.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.40.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.41.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.42.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.43.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.44.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.45.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.46.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.47.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.48.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.49.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.5.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.50.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.51.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.52.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.53.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.54.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.55.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.56.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.57.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.58.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.59.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.6.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.60.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.61.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.62.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.63.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.64.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.65.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.66.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.67.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.68.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.69.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.7.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.70.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.71.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.72.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.73.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.74.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.75.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.76.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.77.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.78.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.79.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.8.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.80.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.81.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.82.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.83.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.84.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.85.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.86.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.87.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.88.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.89.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.9.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.90.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.91.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.92.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.93.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.94.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.95.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.96.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.97.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.98.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.experts.99.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.ffn_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.17.gate.weight": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.17.shared_experts.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.attention.kv_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.q_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.wkv_a_with_mqa.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.wkv_b.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.wo.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.wq_a.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention.wq_b.weight": "consolidated-00004-of-00013.safetensors", "layers.18.attention_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.0.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.1.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.10.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.100.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.101.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.102.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.103.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.104.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.105.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.106.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.107.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.108.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.109.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.11.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.110.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.111.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.112.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.113.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.114.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.115.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.116.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.117.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.118.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.119.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.12.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.120.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.121.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.122.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.123.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.124.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.125.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.126.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.127.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.13.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.14.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.15.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.16.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.17.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.18.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.19.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.2.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.20.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.21.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.22.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.23.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.24.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.25.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.26.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.27.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.28.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.29.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.3.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.30.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.31.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.32.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.33.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.34.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.35.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.36.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.37.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.38.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.39.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.4.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.40.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.41.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.42.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.43.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.44.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.45.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.46.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.47.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.48.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.49.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.5.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.50.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.51.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.52.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.53.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.54.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.55.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.56.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.57.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.58.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.59.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.6.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.60.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.61.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.62.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.63.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.64.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.65.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.66.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.67.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.68.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.69.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.7.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.70.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.71.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.72.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.73.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.74.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.75.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.76.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.77.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.78.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.79.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.8.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.80.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.81.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.82.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.83.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.84.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.85.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.86.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.87.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.88.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.89.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.9.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.90.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.91.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.92.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.93.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.94.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.95.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.96.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.97.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.98.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.experts.99.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.ffn_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.18.gate.weight": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.18.shared_experts.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.attention.kv_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.q_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.wkv_a_with_mqa.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.wkv_b.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.wo.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.wq_a.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention.wq_b.weight": "consolidated-00004-of-00013.safetensors", "layers.19.attention_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.0.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.1.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.10.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.100.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.101.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.102.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.103.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.104.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.105.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.106.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.107.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.108.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.109.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.11.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.110.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.111.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.112.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.113.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.114.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.115.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.116.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.117.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.118.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.119.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.12.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.120.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.121.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.122.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.123.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.124.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.125.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.126.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.127.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.13.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.14.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.15.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.16.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.17.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.18.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.19.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.2.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.20.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.21.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.22.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.23.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.24.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.25.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.26.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.27.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.28.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.29.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.3.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.30.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.31.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.32.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.33.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.34.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.35.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.36.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.37.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.38.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.39.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.4.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.40.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.41.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.42.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.43.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.44.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.45.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.46.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.47.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.48.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.49.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.5.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.50.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.51.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.52.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.53.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.54.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.55.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.56.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.57.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.58.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.59.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.6.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.60.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.61.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.62.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.63.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.64.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.65.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.66.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.67.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.68.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.69.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.7.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.70.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.71.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.72.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.73.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.74.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.75.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.76.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.77.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.78.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.79.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.8.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.80.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.81.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.82.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.83.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.84.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.85.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.86.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.87.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.88.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.89.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.9.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.90.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.91.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.92.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.93.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.94.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.95.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.96.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.97.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.98.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.experts.99.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.ffn_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.19.gate.weight": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.19.shared_experts.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.attention.kv_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.q_a_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.wkv_a_with_mqa.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.wkv_b.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.wo.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.wq_a.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention.wq_b.weight": "consolidated-00004-of-00013.safetensors", "layers.2.attention_norm.weight": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.0.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.1.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.10.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.100.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.101.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.102.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.103.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.104.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.105.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.106.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.107.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.108.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.109.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.11.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.110.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.111.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.112.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.113.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.114.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.115.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.116.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.117.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.118.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.119.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w1.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w1.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w1.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w3.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w3.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.12.w3.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.120.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.120.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.120.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.120.w2.weight_global_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.120.w2.weight_packed": "consolidated-00004-of-00013.safetensors", "layers.2.experts.120.w2.weight_scale": "consolidated-00004-of-00013.safetensors", "layers.2.experts.120.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.120.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.120.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.121.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.122.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.123.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.124.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.125.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.126.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.127.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.13.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.14.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.15.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.16.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.17.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.18.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.19.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.2.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.20.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.21.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.22.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.23.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.24.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.25.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.26.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.27.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.28.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.29.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.3.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.30.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.31.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.32.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.33.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.34.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.35.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.36.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.37.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.38.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.39.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.4.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.40.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.41.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.42.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.43.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.44.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.45.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.46.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.47.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.48.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.49.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.5.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.50.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.51.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.52.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.53.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.54.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.55.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.56.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.57.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.58.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.59.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.6.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.60.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.61.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.62.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.63.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.64.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.65.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.66.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.67.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.68.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.69.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.7.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.70.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.71.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.72.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.73.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.74.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.75.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.76.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.77.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.78.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.79.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.8.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.80.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.81.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.82.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.83.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.84.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.85.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.86.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.87.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.88.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.89.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.9.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.90.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.91.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.92.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.93.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.94.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.95.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.96.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.97.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.98.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.experts.99.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.ffn_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.2.gate.weight": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.2.shared_experts.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.attention.kv_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.q_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.wkv_a_with_mqa.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.wkv_b.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.wo.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.wq_a.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention.wq_b.weight": "consolidated-00005-of-00013.safetensors", "layers.20.attention_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.0.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.1.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.10.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.100.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.101.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.102.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.103.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.104.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.105.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.106.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.107.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.108.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.109.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.11.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.110.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.111.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.112.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.113.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.114.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.115.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.116.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.117.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.118.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.119.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.12.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.120.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.121.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.122.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.123.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.124.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.125.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.126.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.127.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.13.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.14.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.15.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.16.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.17.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.18.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.19.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.2.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.20.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.21.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.22.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.23.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.24.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.25.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.26.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.27.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.28.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.29.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.3.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.30.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.31.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.32.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.33.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.34.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.35.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.36.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.37.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.38.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.39.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.4.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.40.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.41.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.42.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.43.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.44.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.45.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.46.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.47.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.48.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.49.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.5.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.50.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.51.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.52.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.53.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.54.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.55.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.56.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.57.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.58.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.59.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.6.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.60.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.61.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.62.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.63.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.64.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.65.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.66.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.67.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.68.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.69.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.7.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.70.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.71.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.72.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.73.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.74.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.75.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.76.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.77.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.78.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.79.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.8.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.80.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.81.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.82.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.83.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.84.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.85.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.86.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.87.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.88.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.89.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.9.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.90.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.91.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.92.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.93.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.94.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.95.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.96.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.97.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.98.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.experts.99.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.ffn_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.20.gate.weight": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.20.shared_experts.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.attention.kv_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.q_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.wkv_a_with_mqa.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.wkv_b.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.wo.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.wq_a.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention.wq_b.weight": "consolidated-00005-of-00013.safetensors", "layers.21.attention_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.0.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.1.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.10.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.100.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.101.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.102.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.103.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.104.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.105.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.106.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.107.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.108.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.109.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.11.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.110.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.111.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.112.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.113.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.114.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.115.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.116.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.117.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.118.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.119.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.12.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.120.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.121.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.122.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.123.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.124.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.125.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.126.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.127.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.13.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.14.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.15.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.16.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.17.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.18.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.19.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.2.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.20.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.21.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.22.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.23.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.24.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.25.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.26.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.27.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.28.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.29.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.3.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.30.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.31.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.32.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.33.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.34.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.35.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.36.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.37.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.38.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.39.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.4.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.40.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.41.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.42.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.43.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.44.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.45.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.46.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.47.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.48.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.49.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.5.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.50.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.51.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.52.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.53.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.54.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.55.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.56.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.57.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.58.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.59.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.6.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.60.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.61.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.62.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.63.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.64.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.65.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.66.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.67.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.68.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.69.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.7.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.70.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.71.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.72.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.73.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.74.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.75.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.76.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.77.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.78.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.79.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.8.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.80.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.81.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.82.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.83.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.84.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.85.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.86.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.87.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.88.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.89.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.9.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.90.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.91.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.92.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.93.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.94.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.95.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.96.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.97.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.98.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.experts.99.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.ffn_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.21.gate.weight": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.21.shared_experts.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.attention.kv_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.q_a_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.wkv_a_with_mqa.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.wkv_b.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.wo.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.wq_a.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention.wq_b.weight": "consolidated-00005-of-00013.safetensors", "layers.22.attention_norm.weight": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.0.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.1.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.10.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.100.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.101.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.102.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.103.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.104.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.105.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.106.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.107.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.108.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.109.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.11.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.110.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.111.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.112.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.113.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.114.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.115.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.116.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.117.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.118.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.119.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.12.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.120.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.121.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.122.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.123.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.124.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.125.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w1.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w1.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w1.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w2.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w2.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w2.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w3.weight_global_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w3.weight_packed": "consolidated-00005-of-00013.safetensors", "layers.22.experts.126.w3.weight_scale": "consolidated-00005-of-00013.safetensors", "layers.22.experts.127.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.127.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.13.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.14.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.15.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.16.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.17.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.18.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.19.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.2.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.20.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.21.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.22.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.23.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.24.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.25.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.26.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.27.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.28.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.29.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.3.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.30.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.31.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.32.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.33.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.34.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.35.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.36.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.37.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.38.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.39.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.4.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.40.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.41.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.42.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.43.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.44.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.45.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.46.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.47.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.48.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.49.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.5.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.50.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.51.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.52.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.53.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.54.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.55.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.56.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.57.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.58.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.59.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.6.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.60.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.61.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.62.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.63.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.64.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.65.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.66.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.67.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.68.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.69.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.7.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.70.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.71.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.72.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.73.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.74.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.75.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.76.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.77.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.78.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.79.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.8.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.80.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.81.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.82.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.83.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.84.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.85.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.86.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.87.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.88.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.89.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.9.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.90.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.91.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.92.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.93.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.94.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.95.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.96.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.97.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.98.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.experts.99.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.ffn_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.22.gate.weight": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.22.shared_experts.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.attention.kv_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.q_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.wkv_a_with_mqa.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.wkv_b.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.wo.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.wq_a.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention.wq_b.weight": "consolidated-00006-of-00013.safetensors", "layers.23.attention_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.0.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.1.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.10.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.100.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.101.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.102.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.103.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.104.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.105.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.106.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.107.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.108.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.109.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.11.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.110.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.111.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.112.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.113.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.114.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.115.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.116.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.117.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.118.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.119.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.12.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.120.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.121.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.122.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.123.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.124.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.125.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.126.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.127.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.13.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.14.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.15.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.16.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.17.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.18.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.19.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.2.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.20.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.21.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.22.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.23.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.24.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.25.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.26.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.27.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.28.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.29.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.3.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.30.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.31.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.32.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.33.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.34.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.35.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.36.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.37.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.38.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.39.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.4.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.40.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.41.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.42.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.43.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.44.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.45.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.46.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.47.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.48.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.49.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.5.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.50.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.51.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.52.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.53.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.54.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.55.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.56.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.57.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.58.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.59.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.6.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.60.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.61.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.62.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.63.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.64.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.65.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.66.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.67.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.68.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.69.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.7.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.70.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.71.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.72.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.73.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.74.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.75.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.76.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.77.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.78.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.79.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.8.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.80.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.81.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.82.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.83.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.84.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.85.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.86.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.87.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.88.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.89.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.9.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.90.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.91.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.92.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.93.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.94.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.95.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.96.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.97.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.98.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.experts.99.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.ffn_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.23.gate.weight": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.23.shared_experts.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.attention.kv_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.q_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.wkv_a_with_mqa.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.wkv_b.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.wo.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.wq_a.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention.wq_b.weight": "consolidated-00006-of-00013.safetensors", "layers.24.attention_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.0.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.1.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.10.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.100.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.101.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.102.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.103.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.104.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.105.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.106.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.107.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.108.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.109.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.11.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.110.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.111.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.112.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.113.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.114.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.115.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.116.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.117.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.118.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.119.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.12.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.120.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.121.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.122.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.123.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.124.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.125.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.126.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.127.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.13.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.14.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.15.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.16.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.17.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.18.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.19.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.2.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.20.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.21.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.22.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.23.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.24.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.25.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.26.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.27.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.28.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.29.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.3.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.30.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.31.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.32.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.33.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.34.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.35.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.36.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.37.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.38.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.39.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.4.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.40.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.41.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.42.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.43.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.44.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.45.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.46.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.47.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.48.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.49.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.5.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.50.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.51.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.52.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.53.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.54.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.55.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.56.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.57.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.58.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.59.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.6.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.60.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.61.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.62.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.63.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.64.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.65.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.66.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.67.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.68.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.69.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.7.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.70.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.71.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.72.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.73.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.74.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.75.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.76.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.77.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.78.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.79.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.8.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.80.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.81.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.82.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.83.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.84.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.85.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.86.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.87.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.88.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.89.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.9.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.90.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.91.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.92.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.93.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.94.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.95.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.96.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.97.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.98.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.experts.99.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.ffn_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.24.gate.weight": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.24.shared_experts.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.attention.kv_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.q_a_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.wkv_a_with_mqa.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.wkv_b.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.wo.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.wq_a.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention.wq_b.weight": "consolidated-00006-of-00013.safetensors", "layers.25.attention_norm.weight": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.0.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.1.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.10.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.100.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.101.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.102.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.103.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.104.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.105.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.106.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.107.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.108.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.109.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.11.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.110.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.111.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.112.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.113.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.114.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.115.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.116.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.117.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.118.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.119.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.12.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.120.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.121.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.122.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.123.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.124.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.125.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.126.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.127.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.13.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.14.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.15.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.16.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.17.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w1.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w1.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w1.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w2.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w2.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w2.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w3.weight_global_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w3.weight_packed": "consolidated-00006-of-00013.safetensors", "layers.25.experts.18.w3.weight_scale": "consolidated-00006-of-00013.safetensors", "layers.25.experts.19.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.19.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.2.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.20.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.21.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.22.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.23.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.24.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.25.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.26.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.27.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.28.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.29.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.3.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.30.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.31.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.32.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.33.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.34.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.35.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.36.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.37.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.38.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.39.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.4.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.40.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.41.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.42.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.43.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.44.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.45.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.46.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.47.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.48.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.49.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.5.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.50.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.51.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.52.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.53.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.54.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.55.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.56.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.57.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.58.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.59.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.6.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.60.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.61.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.62.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.63.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.64.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.65.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.66.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.67.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.68.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.69.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.7.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.70.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.71.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.72.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.73.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.74.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.75.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.76.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.77.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.78.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.79.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.8.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.80.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.81.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.82.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.83.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.84.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.85.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.86.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.87.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.88.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.89.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.9.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.90.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.91.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.92.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.93.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.94.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.95.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.96.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.97.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.98.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.experts.99.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.ffn_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.25.gate.weight": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.25.shared_experts.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.attention.kv_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.q_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.wkv_a_with_mqa.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.wkv_b.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.wo.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.wq_a.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention.wq_b.weight": "consolidated-00007-of-00013.safetensors", "layers.26.attention_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.0.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.1.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.10.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.100.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.101.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.102.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.103.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.104.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.105.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.106.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.107.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.108.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.109.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.11.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.110.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.111.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.112.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.113.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.114.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.115.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.116.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.117.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.118.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.119.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.12.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.120.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.121.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.122.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.123.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.124.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.125.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.126.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.127.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.13.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.14.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.15.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.16.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.17.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.18.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.19.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.2.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.20.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.21.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.22.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.23.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.24.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.25.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.26.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.27.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.28.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.29.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.3.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.30.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.31.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.32.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.33.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.34.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.35.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.36.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.37.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.38.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.39.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.4.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.40.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.41.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.42.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.43.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.44.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.45.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.46.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.47.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.48.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.49.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.5.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.50.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.51.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.52.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.53.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.54.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.55.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.56.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.57.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.58.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.59.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.6.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.60.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.61.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.62.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.63.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.64.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.65.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.66.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.67.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.68.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.69.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.7.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.70.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.71.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.72.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.73.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.74.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.75.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.76.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.77.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.78.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.79.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.8.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.80.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.81.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.82.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.83.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.84.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.85.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.86.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.87.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.88.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.89.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.9.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.90.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.91.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.92.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.93.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.94.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.95.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.96.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.97.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.98.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.experts.99.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.ffn_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.26.gate.weight": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.26.shared_experts.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.attention.kv_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.q_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.wkv_a_with_mqa.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.wkv_b.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.wo.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.wq_a.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention.wq_b.weight": "consolidated-00007-of-00013.safetensors", "layers.27.attention_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.0.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.1.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.10.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.100.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.101.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.102.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.103.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.104.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.105.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.106.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.107.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.108.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.109.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.11.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.110.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.111.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.112.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.113.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.114.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.115.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.116.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.117.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.118.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.119.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.12.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.120.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.121.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.122.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.123.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.124.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.125.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.126.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.127.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.13.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.14.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.15.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.16.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.17.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.18.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.19.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.2.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.20.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.21.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.22.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.23.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.24.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.25.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.26.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.27.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.28.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.29.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.3.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.30.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.31.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.32.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.33.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.34.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.35.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.36.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.37.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.38.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.39.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.4.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.40.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.41.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.42.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.43.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.44.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.45.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.46.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.47.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.48.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.49.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.5.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.50.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.51.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.52.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.53.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.54.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.55.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.56.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.57.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.58.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.59.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.6.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.60.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.61.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.62.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.63.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.64.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.65.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.66.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.67.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.68.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.69.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.7.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.70.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.71.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.72.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.73.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.74.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.75.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.76.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.77.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.78.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.79.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.8.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.80.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.81.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.82.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.83.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.84.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.85.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.86.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.87.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.88.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.89.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.9.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.90.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.91.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.92.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.93.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.94.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.95.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.96.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.97.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.98.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.experts.99.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.ffn_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.27.gate.weight": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.27.shared_experts.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.attention.kv_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.q_a_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.wkv_a_with_mqa.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.wkv_b.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.wo.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.wq_a.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention.wq_b.weight": "consolidated-00007-of-00013.safetensors", "layers.28.attention_norm.weight": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.0.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.1.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.10.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.100.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.101.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.102.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.103.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.104.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.105.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.106.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.107.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.108.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.109.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.11.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.110.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.111.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.112.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.113.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.114.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.115.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.116.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.117.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.118.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.119.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.12.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.120.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.121.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.122.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.123.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.124.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.125.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.126.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.127.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.13.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.14.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.15.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.16.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.17.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.18.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.19.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.2.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.20.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.21.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.22.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w1.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w1.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w1.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w3.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w3.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.23.w3.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.24.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.24.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.24.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.24.w2.weight_global_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.24.w2.weight_packed": "consolidated-00007-of-00013.safetensors", "layers.28.experts.24.w2.weight_scale": "consolidated-00007-of-00013.safetensors", "layers.28.experts.24.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.24.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.24.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.25.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.26.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.27.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.28.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.29.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.3.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.30.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.31.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.32.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.33.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.34.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.35.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.36.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.37.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.38.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.39.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.4.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.40.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.41.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.42.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.43.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.44.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.45.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.46.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.47.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.48.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.49.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.5.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.50.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.51.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.52.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.53.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.54.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.55.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.56.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.57.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.58.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.59.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.6.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.60.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.61.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.62.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.63.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.64.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.65.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.66.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.67.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.68.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.69.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.7.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.70.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.71.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.72.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.73.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.74.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.75.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.76.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.77.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.78.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.79.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.8.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.80.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.81.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.82.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.83.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.84.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.85.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.86.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.87.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.88.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.89.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.9.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.90.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.91.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.92.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.93.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.94.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.95.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.96.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.97.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.98.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.experts.99.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.ffn_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.28.gate.weight": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.28.shared_experts.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.attention.kv_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.q_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.wkv_a_with_mqa.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.wkv_b.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.wo.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.wq_a.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention.wq_b.weight": "consolidated-00008-of-00013.safetensors", "layers.29.attention_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.0.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.1.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.10.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.100.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.101.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.102.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.103.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.104.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.105.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.106.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.107.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.108.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.109.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.11.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.110.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.111.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.112.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.113.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.114.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.115.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.116.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.117.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.118.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.119.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.12.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.120.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.121.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.122.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.123.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.124.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.125.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.126.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.127.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.13.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.14.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.15.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.16.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.17.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.18.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.19.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.2.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.20.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.21.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.22.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.23.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.24.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.25.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.26.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.27.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.28.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.29.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.3.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.30.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.31.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.32.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.33.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.34.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.35.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.36.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.37.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.38.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.39.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.4.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.40.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.41.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.42.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.43.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.44.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.45.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.46.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.47.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.48.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.49.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.5.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.50.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.51.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.52.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.53.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.54.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.55.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.56.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.57.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.58.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.59.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.6.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.60.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.61.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.62.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.63.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.64.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.65.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.66.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.67.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.68.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.69.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.7.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.70.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.71.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.72.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.73.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.74.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.75.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.76.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.77.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.78.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.79.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.8.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.80.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.81.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.82.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.83.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.84.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.85.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.86.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.87.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.88.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.89.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.9.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.90.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.91.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.92.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.93.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.94.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.95.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.96.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.97.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.98.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.experts.99.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.ffn_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.29.gate.weight": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.29.shared_experts.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.attention.kv_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.q_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.wkv_a_with_mqa.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.wkv_b.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.wo.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.wq_a.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention.wq_b.weight": "consolidated-00008-of-00013.safetensors", "layers.3.attention_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.0.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.1.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.10.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.100.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.101.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.102.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.103.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.104.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.105.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.106.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.107.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.108.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.109.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.11.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.110.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.111.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.112.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.113.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.114.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.115.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.116.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.117.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.118.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.119.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.12.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.120.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.121.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.122.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.123.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.124.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.125.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.126.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.127.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.13.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.14.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.15.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.16.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.17.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.18.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.19.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.2.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.20.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.21.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.22.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.23.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.24.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.25.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.26.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.27.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.28.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.29.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.3.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.30.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.31.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.32.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.33.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.34.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.35.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.36.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.37.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.38.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.39.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.4.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.40.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.41.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.42.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.43.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.44.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.45.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.46.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.47.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.48.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.49.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.5.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.50.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.51.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.52.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.53.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.54.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.55.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.56.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.57.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.58.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.59.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.6.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.60.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.61.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.62.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.63.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.64.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.65.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.66.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.67.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.68.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.69.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.7.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.70.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.71.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.72.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.73.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.74.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.75.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.76.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.77.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.78.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.79.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.8.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.80.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.81.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.82.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.83.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.84.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.85.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.86.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.87.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.88.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.89.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.9.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.90.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.91.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.92.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.93.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.94.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.95.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.96.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.97.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.98.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.experts.99.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.ffn_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.3.gate.weight": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.3.shared_experts.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.attention.kv_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.q_a_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.wkv_a_with_mqa.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.wkv_b.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.wo.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.wq_a.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention.wq_b.weight": "consolidated-00008-of-00013.safetensors", "layers.30.attention_norm.weight": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.0.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.1.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.10.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.100.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.101.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.102.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.103.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.104.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.105.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.106.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.107.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.108.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.109.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.11.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.110.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.111.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.112.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.113.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.114.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.115.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.116.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.117.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.118.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.119.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.12.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.120.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.121.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.122.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.123.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.124.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.125.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.126.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.127.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.13.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.14.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.15.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.16.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.17.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.18.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.19.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.2.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.20.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.21.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.22.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.23.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.24.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.25.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.26.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.27.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.28.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.29.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w1.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w1.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w1.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w2.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w2.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w2.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w3.weight_global_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w3.weight_packed": "consolidated-00008-of-00013.safetensors", "layers.30.experts.3.w3.weight_scale": "consolidated-00008-of-00013.safetensors", "layers.30.experts.30.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.30.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.31.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.32.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.33.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.34.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.35.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.36.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.37.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.38.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.39.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.4.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.40.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.41.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.42.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.43.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.44.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.45.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.46.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.47.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.48.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.49.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.5.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.50.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.51.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.52.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.53.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.54.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.55.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.56.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.57.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.58.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.59.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.6.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.60.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.61.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.62.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.63.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.64.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.65.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.66.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.67.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.68.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.69.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.7.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.70.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.71.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.72.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.73.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.74.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.75.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.76.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.77.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.78.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.79.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.8.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.80.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.81.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.82.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.83.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.84.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.85.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.86.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.87.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.88.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.89.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.9.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.90.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.91.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.92.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.93.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.94.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.95.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.96.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.97.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.98.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.experts.99.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.ffn_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.30.gate.weight": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.30.shared_experts.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.attention.kv_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.q_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.wkv_a_with_mqa.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.wkv_b.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.wo.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.wq_a.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention.wq_b.weight": "consolidated-00009-of-00013.safetensors", "layers.31.attention_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.0.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.1.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.10.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.100.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.101.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.102.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.103.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.104.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.105.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.106.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.107.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.108.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.109.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.11.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.110.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.111.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.112.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.113.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.114.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.115.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.116.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.117.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.118.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.119.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.12.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.120.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.121.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.122.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.123.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.124.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.125.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.126.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.127.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.13.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.14.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.15.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.16.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.17.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.18.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.19.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.2.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.20.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.21.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.22.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.23.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.24.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.25.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.26.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.27.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.28.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.29.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.3.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.30.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.31.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.32.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.33.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.34.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.35.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.36.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.37.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.38.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.39.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.4.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.40.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.41.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.42.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.43.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.44.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.45.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.46.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.47.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.48.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.49.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.5.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.50.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.51.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.52.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.53.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.54.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.55.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.56.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.57.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.58.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.59.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.6.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.60.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.61.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.62.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.63.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.64.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.65.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.66.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.67.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.68.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.69.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.7.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.70.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.71.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.72.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.73.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.74.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.75.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.76.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.77.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.78.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.79.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.8.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.80.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.81.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.82.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.83.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.84.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.85.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.86.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.87.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.88.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.89.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.9.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.90.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.91.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.92.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.93.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.94.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.95.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.96.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.97.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.98.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.experts.99.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.ffn_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.31.gate.weight": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.31.shared_experts.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.attention.kv_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.q_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.wkv_a_with_mqa.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.wkv_b.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.wo.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.wq_a.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention.wq_b.weight": "consolidated-00009-of-00013.safetensors", "layers.32.attention_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.0.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.1.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.10.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.100.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.101.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.102.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.103.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.104.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.105.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.106.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.107.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.108.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.109.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.11.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.110.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.111.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.112.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.113.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.114.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.115.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.116.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.117.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.118.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.119.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.12.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.120.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.121.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.122.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.123.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.124.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.125.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.126.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.127.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.13.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.14.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.15.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.16.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.17.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.18.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.19.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.2.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.20.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.21.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.22.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.23.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.24.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.25.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.26.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.27.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.28.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.29.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.3.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.30.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.31.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.32.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.33.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.34.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.35.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.36.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.37.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.38.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.39.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.4.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.40.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.41.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.42.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.43.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.44.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.45.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.46.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.47.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.48.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.49.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.5.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.50.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.51.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.52.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.53.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.54.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.55.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.56.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.57.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.58.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.59.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.6.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.60.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.61.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.62.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.63.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.64.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.65.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.66.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.67.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.68.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.69.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.7.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.70.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.71.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.72.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.73.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.74.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.75.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.76.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.77.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.78.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.79.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.8.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.80.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.81.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.82.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.83.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.84.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.85.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.86.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.87.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.88.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.89.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.9.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.90.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.91.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.92.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.93.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.94.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.95.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.96.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.97.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.98.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.experts.99.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.ffn_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.32.gate.weight": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.32.shared_experts.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.attention.kv_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.q_a_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.wkv_a_with_mqa.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.wkv_b.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.wo.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.wq_a.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention.wq_b.weight": "consolidated-00009-of-00013.safetensors", "layers.33.attention_norm.weight": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.0.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.1.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.10.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.100.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.101.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.102.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.103.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.104.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.105.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.106.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.107.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.108.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.109.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.11.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.110.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.111.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.112.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.113.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.114.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.115.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.116.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.117.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.118.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.119.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.12.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.120.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.121.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.122.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.123.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.124.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.125.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.126.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.127.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.13.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.14.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.15.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.16.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.17.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.18.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.19.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.2.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.20.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.21.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.22.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.23.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.24.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.25.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.26.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.27.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.28.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.29.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.3.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.30.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.31.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.32.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.33.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.34.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.35.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w1.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w1.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w1.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w2.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w2.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w2.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w3.weight_global_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w3.weight_packed": "consolidated-00009-of-00013.safetensors", "layers.33.experts.36.w3.weight_scale": "consolidated-00009-of-00013.safetensors", "layers.33.experts.37.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.37.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.38.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.39.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.4.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.40.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.41.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.42.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.43.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.44.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.45.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.46.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.47.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.48.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.49.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.5.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.50.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.51.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.52.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.53.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.54.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.55.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.56.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.57.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.58.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.59.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.6.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.60.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.61.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.62.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.63.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.64.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.65.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.66.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.67.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.68.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.69.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.7.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.70.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.71.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.72.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.73.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.74.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.75.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.76.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.77.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.78.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.79.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.8.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.80.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.81.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.82.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.83.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.84.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.85.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.86.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.87.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.88.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.89.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.9.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.90.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.91.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.92.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.93.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.94.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.95.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.96.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.97.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.98.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.experts.99.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.ffn_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.33.gate.weight": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.33.shared_experts.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.attention.kv_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.q_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.wkv_a_with_mqa.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.wkv_b.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.wo.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.wq_a.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention.wq_b.weight": "consolidated-00010-of-00013.safetensors", "layers.34.attention_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.0.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.1.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.10.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.100.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.101.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.102.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.103.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.104.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.105.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.106.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.107.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.108.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.109.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.11.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.110.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.111.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.112.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.113.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.114.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.115.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.116.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.117.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.118.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.119.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.12.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.120.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.121.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.122.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.123.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.124.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.125.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.126.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.127.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.13.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.14.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.15.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.16.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.17.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.18.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.19.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.2.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.20.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.21.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.22.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.23.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.24.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.25.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.26.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.27.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.28.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.29.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.3.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.30.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.31.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.32.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.33.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.34.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.35.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.36.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.37.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.38.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.39.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.4.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.40.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.41.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.42.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.43.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.44.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.45.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.46.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.47.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.48.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.49.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.5.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.50.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.51.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.52.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.53.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.54.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.55.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.56.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.57.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.58.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.59.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.6.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.60.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.61.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.62.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.63.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.64.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.65.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.66.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.67.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.68.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.69.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.7.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.70.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.71.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.72.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.73.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.74.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.75.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.76.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.77.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.78.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.79.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.8.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.80.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.81.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.82.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.83.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.84.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.85.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.86.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.87.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.88.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.89.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.9.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.90.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.91.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.92.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.93.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.94.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.95.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.96.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.97.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.98.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.experts.99.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.ffn_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.34.gate.weight": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.34.shared_experts.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.attention.kv_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.q_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.wkv_a_with_mqa.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.wkv_b.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.wo.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.wq_a.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention.wq_b.weight": "consolidated-00010-of-00013.safetensors", "layers.35.attention_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.0.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.1.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.10.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.100.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.101.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.102.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.103.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.104.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.105.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.106.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.107.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.108.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.109.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.11.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.110.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.111.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.112.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.113.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.114.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.115.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.116.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.117.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.118.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.119.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.12.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.120.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.121.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.122.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.123.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.124.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.125.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.126.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.127.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.13.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.14.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.15.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.16.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.17.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.18.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.19.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.2.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.20.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.21.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.22.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.23.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.24.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.25.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.26.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.27.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.28.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.29.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.3.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.30.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.31.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.32.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.33.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.34.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.35.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.36.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.37.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.38.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.39.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.4.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.40.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.41.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.42.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.43.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.44.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.45.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.46.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.47.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.48.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.49.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.5.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.50.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.51.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.52.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.53.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.54.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.55.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.56.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.57.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.58.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.59.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.6.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.60.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.61.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.62.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.63.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.64.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.65.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.66.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.67.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.68.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.69.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.7.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.70.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.71.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.72.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.73.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.74.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.75.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.76.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.77.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.78.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.79.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.8.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.80.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.81.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.82.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.83.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.84.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.85.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.86.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.87.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.88.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.89.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.9.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.90.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.91.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.92.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.93.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.94.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.95.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.96.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.97.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.98.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.experts.99.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.ffn_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.35.gate.weight": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.35.shared_experts.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.attention.kv_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.q_a_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.wkv_a_with_mqa.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.wkv_b.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.wo.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.wq_a.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention.wq_b.weight": "consolidated-00010-of-00013.safetensors", "layers.4.attention_norm.weight": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.0.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.1.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.10.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.100.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.101.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.102.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.103.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.104.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.105.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.106.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.107.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.108.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.109.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.11.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.110.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.111.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.112.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.113.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.114.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.115.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.116.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.117.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.118.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.119.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.12.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.120.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.121.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.122.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.123.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.124.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.125.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.126.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.127.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.13.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.14.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.15.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.16.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.17.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.18.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.19.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.2.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.20.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.21.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.22.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.23.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.24.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.25.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.26.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.27.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.28.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.29.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.3.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.30.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.31.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.32.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.33.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.34.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.35.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.36.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.37.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.38.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.39.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.4.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.40.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w1.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w1.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w1.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w3.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w3.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.41.w3.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.42.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.42.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.42.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.42.w2.weight_global_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.42.w2.weight_packed": "consolidated-00010-of-00013.safetensors", "layers.4.experts.42.w2.weight_scale": "consolidated-00010-of-00013.safetensors", "layers.4.experts.42.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.42.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.42.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.43.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.44.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.45.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.46.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.47.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.48.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.49.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.5.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.50.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.51.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.52.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.53.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.54.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.55.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.56.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.57.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.58.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.59.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.6.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.60.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.61.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.62.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.63.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.64.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.65.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.66.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.67.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.68.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.69.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.7.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.70.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.71.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.72.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.73.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.74.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.75.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.76.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.77.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.78.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.79.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.8.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.80.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.81.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.82.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.83.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.84.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.85.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.86.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.87.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.88.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.89.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.9.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.90.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.91.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.92.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.93.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.94.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.95.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.96.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.97.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.98.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.experts.99.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.ffn_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.4.gate.weight": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.4.shared_experts.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.attention.kv_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.q_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.wkv_a_with_mqa.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.wkv_b.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.wo.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.wq_a.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention.wq_b.weight": "consolidated-00011-of-00013.safetensors", "layers.5.attention_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.0.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.1.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.10.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.100.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.101.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.102.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.103.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.104.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.105.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.106.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.107.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.108.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.109.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.11.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.110.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.111.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.112.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.113.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.114.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.115.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.116.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.117.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.118.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.119.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.12.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.120.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.121.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.122.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.123.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.124.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.125.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.126.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.127.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.13.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.14.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.15.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.16.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.17.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.18.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.19.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.2.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.20.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.21.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.22.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.23.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.24.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.25.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.26.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.27.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.28.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.29.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.3.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.30.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.31.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.32.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.33.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.34.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.35.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.36.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.37.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.38.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.39.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.4.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.40.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.41.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.42.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.43.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.44.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.45.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.46.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.47.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.48.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.49.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.5.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.50.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.51.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.52.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.53.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.54.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.55.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.56.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.57.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.58.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.59.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.6.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.60.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.61.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.62.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.63.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.64.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.65.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.66.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.67.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.68.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.69.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.7.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.70.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.71.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.72.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.73.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.74.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.75.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.76.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.77.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.78.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.79.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.8.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.80.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.81.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.82.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.83.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.84.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.85.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.86.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.87.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.88.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.89.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.9.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.90.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.91.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.92.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.93.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.94.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.95.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.96.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.97.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.98.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.experts.99.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.ffn_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.5.gate.weight": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.5.shared_experts.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.attention.kv_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.q_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.wkv_a_with_mqa.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.wkv_b.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.wo.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.wq_a.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention.wq_b.weight": "consolidated-00011-of-00013.safetensors", "layers.6.attention_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.0.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.1.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.10.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.100.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.101.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.102.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.103.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.104.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.105.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.106.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.107.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.108.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.109.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.11.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.110.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.111.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.112.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.113.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.114.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.115.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.116.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.117.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.118.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.119.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.12.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.120.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.121.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.122.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.123.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.124.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.125.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.126.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.127.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.13.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.14.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.15.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.16.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.17.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.18.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.19.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.2.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.20.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.21.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.22.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.23.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.24.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.25.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.26.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.27.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.28.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.29.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.3.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.30.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.31.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.32.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.33.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.34.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.35.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.36.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.37.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.38.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.39.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.4.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.40.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.41.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.42.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.43.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.44.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.45.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.46.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.47.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.48.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.49.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.5.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.50.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.51.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.52.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.53.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.54.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.55.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.56.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.57.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.58.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.59.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.6.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.60.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.61.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.62.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.63.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.64.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.65.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.66.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.67.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.68.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.69.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.7.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.70.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.71.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.72.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.73.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.74.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.75.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.76.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.77.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.78.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.79.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.8.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.80.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.81.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.82.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.83.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.84.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.85.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.86.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.87.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.88.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.89.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.9.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.90.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.91.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.92.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.93.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.94.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.95.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.96.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.97.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.98.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.experts.99.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.ffn_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.6.gate.weight": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.6.shared_experts.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.attention.kv_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.q_a_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.wkv_a_with_mqa.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.wkv_b.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.wo.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.wq_a.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention.wq_b.weight": "consolidated-00011-of-00013.safetensors", "layers.7.attention_norm.weight": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.0.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.1.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.10.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.100.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.101.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.102.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.103.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.104.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.105.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.106.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.107.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.108.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.109.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.11.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.110.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.111.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.112.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.113.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.114.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.115.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.116.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.117.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.118.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.119.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.12.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.120.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.121.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.122.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.123.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.124.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.125.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.126.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.127.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.13.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.14.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.15.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.16.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.17.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.18.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.19.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.2.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.20.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.21.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.22.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.23.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.24.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.25.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.26.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.27.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.28.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.29.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.3.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.30.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.31.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.32.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.33.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.34.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.35.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.36.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.37.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.38.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.39.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.4.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.40.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.41.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.42.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.43.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.44.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.45.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.46.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.47.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w1.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w1.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w1.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w2.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w2.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w2.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w3.weight_global_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w3.weight_packed": "consolidated-00011-of-00013.safetensors", "layers.7.experts.48.w3.weight_scale": "consolidated-00011-of-00013.safetensors", "layers.7.experts.49.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.49.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.5.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.50.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.51.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.52.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.53.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.54.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.55.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.56.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.57.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.58.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.59.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.6.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.60.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.61.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.62.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.63.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.64.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.65.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.66.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.67.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.68.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.69.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.7.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.70.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.71.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.72.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.73.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.74.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.75.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.76.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.77.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.78.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.79.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.8.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.80.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.81.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.82.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.83.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.84.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.85.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.86.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.87.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.88.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.89.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.9.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.90.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.91.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.92.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.93.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.94.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.95.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.96.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.97.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.98.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.experts.99.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.7.gate.weight": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.7.shared_experts.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.attention.kv_a_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.q_a_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.wkv_a_with_mqa.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.wkv_b.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.wq_a.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention.wq_b.weight": "consolidated-00012-of-00013.safetensors", "layers.8.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.0.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.1.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.10.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.100.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.101.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.102.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.103.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.104.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.105.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.106.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.107.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.108.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.109.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.11.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.110.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.111.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.112.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.113.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.114.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.115.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.116.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.117.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.118.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.119.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.12.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.120.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.121.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.122.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.123.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.124.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.125.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.126.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.127.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.13.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.14.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.15.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.16.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.17.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.18.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.19.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.2.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.20.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.21.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.22.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.23.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.24.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.25.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.26.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.27.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.28.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.29.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.3.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.30.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.31.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.32.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.33.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.34.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.35.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.36.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.37.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.38.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.39.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.4.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.40.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.41.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.42.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.43.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.44.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.45.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.46.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.47.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.48.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.49.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.5.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.50.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.51.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.52.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.53.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.54.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.55.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.56.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.57.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.58.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.59.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.6.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.60.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.61.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.62.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.63.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.64.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.65.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.66.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.67.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.68.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.69.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.7.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.70.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.71.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.72.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.73.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.74.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.75.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.76.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.77.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.78.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.79.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.8.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.80.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.81.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.82.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.83.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.84.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.85.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.86.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.87.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.88.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.89.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.9.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.90.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.91.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.92.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.93.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.94.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.95.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.96.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.97.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.98.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.experts.99.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.8.gate.weight": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.8.shared_experts.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.attention.kv_a_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.q_a_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.wkv_a_with_mqa.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.wkv_b.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.wq_a.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention.wq_b.weight": "consolidated-00012-of-00013.safetensors", "layers.9.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.0.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.1.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.10.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.100.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.101.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.102.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.103.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.104.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.105.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.106.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.107.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.108.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.109.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.11.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.110.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.111.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.112.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.113.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.114.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.115.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.116.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.117.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.118.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.119.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.12.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.120.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.121.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.122.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.123.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.124.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.125.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.126.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.127.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.13.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.14.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.15.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.16.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.17.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.18.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.19.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.2.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.20.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.21.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.22.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.23.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.24.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.25.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.26.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.27.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.28.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.29.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.3.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.30.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.31.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.32.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.33.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.34.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.35.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.36.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.37.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.38.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.39.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.4.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.40.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.41.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.42.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.43.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.44.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.45.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.46.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.47.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.48.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.49.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.5.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.50.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.51.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.52.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.53.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.54.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.55.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.56.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.57.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.58.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.59.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.6.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.60.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.61.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.62.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.63.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.64.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.65.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.66.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.67.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.68.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.69.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.7.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.70.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.71.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.72.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.73.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.74.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.75.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.76.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.77.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.78.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.79.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.8.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.80.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.81.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.82.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.83.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.84.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.85.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.86.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.87.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.88.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.89.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.9.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.90.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.91.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.92.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.93.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.94.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.95.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.96.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.97.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.98.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.experts.99.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "layers.9.gate.weight": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w1.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w1.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w1.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w2.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w2.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w2.weight_scale": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w3.weight_global_scale": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w3.weight_packed": "consolidated-00012-of-00013.safetensors", "layers.9.shared_experts.w3.weight_scale": "consolidated-00012-of-00013.safetensors", "norm.weight": "consolidated-00012-of-00013.safetensors", "output.weight": "consolidated-00012-of-00013.safetensors", "patch_merger.merging_layer.weight": "consolidated-00012-of-00013.safetensors", "pre_mm_projector_norm.weight": "consolidated-00012-of-00013.safetensors", "tok_embeddings.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.ln_pre.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.patch_conv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.0.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.1.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.10.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.11.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.12.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.13.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.14.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.15.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.16.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.17.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.18.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.19.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.2.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.20.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.21.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.22.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.23.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.3.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.4.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.5.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.6.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.7.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.8.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.attention.wk.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.attention.wo.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.attention.wq.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.attention.wv.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.attention_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.feed_forward.w1.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.feed_forward.w2.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.feed_forward.w3.weight": "consolidated-00012-of-00013.safetensors", "vision_encoder.transformer.layers.9.ffn_norm.weight": "consolidated-00012-of-00013.safetensors", "vision_language_adapter.w_in.weight": "consolidated-00012-of-00013.safetensors", "vision_language_adapter.w_out.weight": "consolidated-00012-of-00013.safetensors", "layers.0.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.shared_experts.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.shared_experts.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.shared_experts.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.0.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.1.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.2.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.3.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.4.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.5.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.6.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.7.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.8.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.9.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.10.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.11.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.12.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.13.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.14.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.15.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.16.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.17.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.18.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.19.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.20.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.21.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.22.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.23.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.24.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.25.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.26.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.27.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.28.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.29.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.30.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.31.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.32.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.33.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.34.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.0.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.0.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.1.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.1.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.2.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.2.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.3.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.3.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.4.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.4.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.5.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.5.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.6.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.6.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.7.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.7.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.8.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.8.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.9.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.9.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.10.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.10.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.11.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.11.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.12.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.12.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.13.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.13.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.14.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.14.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.15.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.15.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.16.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.16.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.17.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.17.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.18.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.18.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.19.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.19.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.20.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.20.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.21.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.21.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.22.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.22.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.23.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.23.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.24.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.24.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.25.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.25.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.26.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.26.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.27.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.27.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.28.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.28.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.29.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.29.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.30.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.30.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.31.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.31.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.32.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.32.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.33.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.33.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.34.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.34.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.35.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.35.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.36.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.36.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.37.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.37.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.38.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.38.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.39.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.39.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.40.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.40.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.41.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.41.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.42.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.42.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.43.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.43.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.44.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.44.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.45.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.45.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.46.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.46.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.47.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.47.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.48.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.48.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.49.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.49.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.50.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.50.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.51.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.51.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.52.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.52.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.53.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.53.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.54.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.54.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.55.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.55.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.56.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.56.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.57.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.57.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.58.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.58.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.59.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.59.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.60.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.60.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.61.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.61.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.62.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.62.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.63.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.63.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.64.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.64.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.65.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.65.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.66.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.66.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.67.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.67.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.68.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.68.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.69.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.69.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.70.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.70.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.71.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.71.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.72.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.72.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.73.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.73.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.74.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.74.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.75.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.75.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.76.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.76.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.77.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.77.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.78.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.78.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.79.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.79.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.80.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.80.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.81.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.81.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.82.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.82.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.83.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.83.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.84.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.84.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.85.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.85.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.86.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.86.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.87.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.87.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.88.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.88.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.89.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.89.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.90.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.90.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.91.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.91.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.92.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.92.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.93.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.93.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.94.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.94.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.95.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.95.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.96.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.96.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.97.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.97.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.98.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.98.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.99.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.99.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.100.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.100.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.101.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.101.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.102.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.102.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.103.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.103.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.104.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.104.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.105.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.105.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.106.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.106.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.107.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.107.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.108.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.108.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.109.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.109.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.110.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.110.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.111.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.111.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.112.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.112.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.113.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.113.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.114.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.114.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.115.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.115.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.116.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.116.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.117.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.117.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.118.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.118.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.119.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.119.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.120.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.120.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.121.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.121.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.122.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.122.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.123.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.123.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.124.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.124.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.125.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.125.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.126.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.126.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.127.w1.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.127.w3.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.0.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.1.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.2.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.3.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.4.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.5.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.6.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.7.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.8.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.9.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.10.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.11.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.12.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.13.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.14.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.15.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.16.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.17.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.18.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.19.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.20.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.21.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.22.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.23.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.24.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.25.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.26.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.27.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.28.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.29.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.30.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.31.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.32.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.33.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.34.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.35.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.36.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.37.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.38.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.39.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.40.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.41.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.42.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.43.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.44.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.45.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.46.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.47.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.48.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.49.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.50.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.51.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.52.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.53.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.54.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.55.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.56.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.57.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.58.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.59.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.60.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.61.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.62.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.63.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.64.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.65.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.66.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.67.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.68.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.69.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.70.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.71.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.72.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.73.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.74.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.75.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.76.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.77.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.78.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.79.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.80.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.81.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.82.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.83.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.84.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.85.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.86.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.87.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.88.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.89.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.90.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.91.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.92.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.93.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.94.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.95.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.96.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.97.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.98.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.99.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.100.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.101.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.102.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.103.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.104.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.105.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.106.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.107.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.108.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.109.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.110.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.111.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.112.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.113.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.114.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.115.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.116.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.117.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.118.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.119.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.120.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.121.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.122.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.123.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.124.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.125.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.126.w2.input_global_scale": "consolidated-00013-of-00013.safetensors", "layers.35.experts.127.w2.input_global_scale": "consolidated-00013-of-00013.safetensors" } }