Safetensors
English
Infinity / infinity_8b_weights /model.safetensors.index.json
hanjian.thu123
[update] add infinity_8b_weights
9fe79d8
{
"metadata": {
"total_size": 33504330240
},
"weight_map": {
"block_chunks.0.module.0.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.0.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.1.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.2.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.3.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.0.module.4.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.0.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.1.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.2.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.3.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ada_gss": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.scale_mul_1H11": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.q_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.mat_qkv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.sa.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.v_bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.mat_q.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.mat_q.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.mat_kv.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.proj.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca.proj.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ffn.fc1.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ffn.fc1.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ffn.fc2.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ffn.fc2.bias": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca_norm.weight": "model-00001-of-00004.safetensors",
"block_chunks.1.module.4.ca_norm.bias": "model-00001-of-00004.safetensors",
"block_chunks.2.module.0.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.0.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.1.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.2.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.3.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.2.module.4.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.0.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.1.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.2.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.3.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ada_gss": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.scale_mul_1H11": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.q_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.mat_qkv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.sa.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.v_bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.mat_q.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.mat_q.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.mat_kv.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.proj.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca.proj.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ffn.fc1.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ffn.fc1.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ffn.fc2.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ffn.fc2.bias": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca_norm.weight": "model-00002-of-00004.safetensors",
"block_chunks.3.module.4.ca_norm.bias": "model-00002-of-00004.safetensors",
"block_chunks.4.module.0.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.0.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.1.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.2.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.3.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.4.module.4.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.0.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.1.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.2.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.3.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ada_gss": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.scale_mul_1H11": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.q_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.mat_qkv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.sa.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.v_bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.mat_q.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.mat_q.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.mat_kv.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.proj.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca.proj.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ffn.fc1.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ffn.fc1.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ffn.fc2.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ffn.fc2.bias": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca_norm.weight": "model-00003-of-00004.safetensors",
"block_chunks.5.module.4.ca_norm.bias": "model-00003-of-00004.safetensors",
"block_chunks.6.module.0.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ada_gss": "model-00004-of-00004.safetensors",
"text_norm.weight": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.0.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.1.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.2.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.3.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.4.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.5.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.zero_k_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.0.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.1.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.2.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.3.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.6.module.4.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.0.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.1.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.2.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.3.ca_norm.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ada_gss": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.scale_mul_1H11": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.q_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.mat_qkv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.sa.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.v_bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.mat_q.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.mat_q.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.proj.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca.proj.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ffn.fc1.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ffn.fc1.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ffn.fc2.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ffn.fc2.bias": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca_norm.weight": "model-00004-of-00004.safetensors",
"block_chunks.7.module.4.ca_norm.bias": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.mat_q": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.v_bias": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.mat_kv.weight": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.proj.weight": "model-00004-of-00004.safetensors",
"text_proj_for_sos.ca.proj.bias": "model-00004-of-00004.safetensors",
"text_proj_for_ca.0.weight": "model-00004-of-00004.safetensors",
"text_proj_for_ca.0.bias": "model-00004-of-00004.safetensors",
"text_proj_for_ca.2.weight": "model-00004-of-00004.safetensors",
"text_proj_for_ca.2.bias": "model-00004-of-00004.safetensors",
"lvl_embed.weight": "model-00004-of-00004.safetensors",
"word_embed.weight": "model-00004-of-00004.safetensors",
"word_embed.bias": "model-00004-of-00004.safetensors",
"shared_ada_lin.1.weight": "model-00004-of-00004.safetensors",
"shared_ada_lin.1.bias": "model-00004-of-00004.safetensors",
"head_nm.ada_lin.1.weight": "model-00004-of-00004.safetensors",
"head_nm.ada_lin.1.bias": "model-00004-of-00004.safetensors",
"head.weight": "model-00004-of-00004.safetensors",
"head.bias": "model-00004-of-00004.safetensors",
"cfg_uncond": "model-00004-of-00004.safetensors",
"pos_start": "model-00004-of-00004.safetensors"
}
}