{ "metadata": { "total_size": 8516804608 }, "weight_map": { "model.embed_tokens.biases": "model-00001-of-00002.safetensors", "model.embed_tokens.scales": "model-00001-of-00002.safetensors", "model.embed_tokens.weight": "model-00001-of-00002.safetensors", "model.layers.0.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.0.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.0.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.0.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.0.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.0.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.0.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.0.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.0.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.0.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.0.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.0.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.0.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.0.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.0.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.0.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.0.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.0.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.0.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.0.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.1.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.1.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.1.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.1.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.1.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.1.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.1.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.1.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.1.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.1.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.1.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.1.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.1.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.1.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.1.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.1.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.1.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.1.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.1.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.10.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.10.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.10.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.10.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.10.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.10.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.10.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.10.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.10.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.10.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.10.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.10.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.10.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.10.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.10.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.10.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.10.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.10.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.10.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.11.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.11.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.11.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.11.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.11.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.11.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.11.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.11.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.11.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.11.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.11.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.11.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.11.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.11.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.11.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.11.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.11.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.11.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.11.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.12.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.12.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.12.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.12.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.12.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.12.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.12.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.12.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.12.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.12.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.12.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.12.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.12.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.12.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.12.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.12.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.12.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.12.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.12.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.13.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.13.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.13.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.13.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.13.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.13.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.13.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.13.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.13.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.13.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.13.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.13.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.13.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.13.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.13.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.13.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.13.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.13.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.13.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.14.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.14.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.14.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.14.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.14.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.14.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.14.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.14.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.14.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.14.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.14.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.14.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.14.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.14.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.14.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.14.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.14.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.14.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.14.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.15.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.15.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.15.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.15.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.15.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.15.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.15.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.15.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.15.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.15.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.15.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.15.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.15.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.15.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.15.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.15.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.15.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.15.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.15.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.16.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.16.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.16.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.16.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.16.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.16.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.16.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.16.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.16.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.16.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.16.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.16.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.16.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.16.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.16.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.16.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.16.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.16.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.16.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.17.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.17.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.17.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.17.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.17.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.17.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.17.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.17.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.17.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.17.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.17.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.17.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.17.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.17.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.17.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.17.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.17.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.17.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.17.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.18.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.18.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.18.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.18.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.18.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.18.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.18.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.18.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.18.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.18.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.18.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.18.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.18.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.18.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.18.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.18.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.18.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.18.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.18.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.19.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.19.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.19.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.19.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.19.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.19.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.19.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.19.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.19.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.19.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.19.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.19.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.19.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.19.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.19.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.19.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.19.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.19.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.19.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.2.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.2.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.2.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.2.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.2.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.2.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.2.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.2.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.2.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.2.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.2.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.2.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.2.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.2.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.2.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.2.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.2.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.2.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.2.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.20.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.20.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.20.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.20.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.20.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.20.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.20.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.20.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.20.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.20.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.20.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.20.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.20.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.20.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.20.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.20.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.20.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.20.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.20.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.21.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.21.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.21.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.21.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.21.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.21.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.21.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.21.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.21.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.21.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.21.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.21.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.21.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.21.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.21.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.21.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.21.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.21.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.21.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.21.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.21.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.21.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.21.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.22.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.22.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.22.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.22.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.22.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.22.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.22.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.22.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.22.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.22.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.22.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.22.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.22.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.22.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.22.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.22.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.22.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.22.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.22.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.22.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.22.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.22.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.22.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.23.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.23.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.23.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.23.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.23.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.23.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.23.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.23.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.23.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.23.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.23.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.23.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.23.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.23.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.23.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.23.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.23.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.23.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.23.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.23.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.23.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.23.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.23.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.24.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.24.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.24.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.24.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.24.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.24.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.24.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.24.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.24.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.24.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.24.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.24.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.24.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.24.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.24.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.24.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.24.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.24.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.24.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.24.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.24.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.24.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.24.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.25.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.25.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.25.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.25.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.25.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.25.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.25.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.25.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.25.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.25.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.25.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.25.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.25.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.25.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.25.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.25.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.25.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.25.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.25.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.25.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.25.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.25.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.25.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.26.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.26.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.26.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.26.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.26.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.26.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.26.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.26.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.26.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.26.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.26.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.26.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.26.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.26.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.26.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.26.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.26.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.26.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.26.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.26.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.26.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.26.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.26.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.27.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.27.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.27.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.27.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.27.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.27.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.27.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.27.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.27.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.27.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.27.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.27.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.27.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.27.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.27.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.27.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.27.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.27.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.27.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.27.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.27.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.27.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.27.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.28.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.28.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.28.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.28.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.28.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.28.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.28.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.28.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.28.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.28.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.28.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.28.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.28.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.28.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.28.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.28.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.28.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.28.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.28.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.29.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.29.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.29.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.29.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.29.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.29.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.29.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.29.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.29.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.29.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.29.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.29.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.29.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.29.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.29.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.29.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.29.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.29.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.29.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.3.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.3.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.3.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.3.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.3.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.3.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.3.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.3.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.3.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.3.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.3.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.3.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.3.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.3.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.3.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.3.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.3.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.3.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.3.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.3.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.30.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.30.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.30.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.30.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.30.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.30.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.30.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.30.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.30.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.30.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.30.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.30.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.30.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.30.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.30.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.30.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.30.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.30.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.30.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.30.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.attn_norm.weight": "model-00002-of-00002.safetensors", "model.layers.31.attn_out.biases": "model-00002-of-00002.safetensors", "model.layers.31.attn_out.scales": "model-00002-of-00002.safetensors", "model.layers.31.attn_out.weight": "model-00002-of-00002.safetensors", "model.layers.31.ff_norm.weight": "model-00002-of-00002.safetensors", "model.layers.31.ff_out.biases": "model-00002-of-00002.safetensors", "model.layers.31.ff_out.scales": "model-00002-of-00002.safetensors", "model.layers.31.ff_out.weight": "model-00002-of-00002.safetensors", "model.layers.31.ff_proj.biases": "model-00002-of-00002.safetensors", "model.layers.31.ff_proj.scales": "model-00002-of-00002.safetensors", "model.layers.31.ff_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.k_proj.biases": "model-00002-of-00002.safetensors", "model.layers.31.k_proj.scales": "model-00002-of-00002.safetensors", "model.layers.31.k_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.q_proj.biases": "model-00002-of-00002.safetensors", "model.layers.31.q_proj.scales": "model-00002-of-00002.safetensors", "model.layers.31.q_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.up_proj.biases": "model-00002-of-00002.safetensors", "model.layers.31.up_proj.scales": "model-00002-of-00002.safetensors", "model.layers.31.up_proj.weight": "model-00002-of-00002.safetensors", "model.layers.31.v_proj.biases": "model-00002-of-00002.safetensors", "model.layers.31.v_proj.scales": "model-00002-of-00002.safetensors", "model.layers.31.v_proj.weight": "model-00002-of-00002.safetensors", "model.layers.4.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.4.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.4.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.4.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.4.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.4.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.4.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.4.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.4.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.4.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.4.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.4.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.4.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.4.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.4.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.4.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.4.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.4.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.4.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.4.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.5.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.5.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.5.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.5.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.5.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.5.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.5.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.5.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.5.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.5.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.5.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.5.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.5.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.5.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.5.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.5.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.5.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.5.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.5.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.6.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.6.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.6.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.6.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.6.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.6.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.6.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.6.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.6.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.6.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.6.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.6.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.6.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.6.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.6.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.6.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.6.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.6.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.6.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.7.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.7.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.7.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.7.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.7.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.7.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.7.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.7.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.7.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.7.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.7.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.7.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.7.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.7.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.7.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.7.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.7.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.7.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.7.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.8.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.8.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.8.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.8.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.8.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.8.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.8.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.8.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.8.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.8.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.8.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.8.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.8.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.8.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.8.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.8.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.8.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.8.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.8.v_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.attn_norm.weight": "model-00001-of-00002.safetensors", "model.layers.9.attn_out.biases": "model-00001-of-00002.safetensors", "model.layers.9.attn_out.scales": "model-00001-of-00002.safetensors", "model.layers.9.attn_out.weight": "model-00001-of-00002.safetensors", "model.layers.9.ff_norm.weight": "model-00001-of-00002.safetensors", "model.layers.9.ff_out.biases": "model-00001-of-00002.safetensors", "model.layers.9.ff_out.scales": "model-00001-of-00002.safetensors", "model.layers.9.ff_out.weight": "model-00001-of-00002.safetensors", "model.layers.9.ff_proj.biases": "model-00001-of-00002.safetensors", "model.layers.9.ff_proj.scales": "model-00001-of-00002.safetensors", "model.layers.9.ff_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.k_proj.biases": "model-00001-of-00002.safetensors", "model.layers.9.k_proj.scales": "model-00001-of-00002.safetensors", "model.layers.9.k_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.q_proj.biases": "model-00001-of-00002.safetensors", "model.layers.9.q_proj.scales": "model-00001-of-00002.safetensors", "model.layers.9.q_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.up_proj.biases": "model-00001-of-00002.safetensors", "model.layers.9.up_proj.scales": "model-00001-of-00002.safetensors", "model.layers.9.up_proj.weight": "model-00001-of-00002.safetensors", "model.layers.9.v_proj.biases": "model-00001-of-00002.safetensors", "model.layers.9.v_proj.scales": "model-00001-of-00002.safetensors", "model.layers.9.v_proj.weight": "model-00001-of-00002.safetensors", "model.lm_head.biases": "model-00002-of-00002.safetensors", "model.lm_head.scales": "model-00002-of-00002.safetensors", "model.lm_head.weight": "model-00002-of-00002.safetensors", "model.norm.weight": "model-00002-of-00002.safetensors" } }