kosmos-2.5 / model.safetensors.index.json
Ubuntu
add hf
f29bcc9
{
"metadata": {
"total_size": 5498585088
},
"weight_map": {
"image_to_text_projection.dense.bias": "model-00002-of-00002.safetensors",
"image_to_text_projection.dense.weight": "model-00002-of-00002.safetensors",
"image_to_text_projection.latent_query": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.k_proj.bias": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.k_proj.weight": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.out_proj.bias": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.out_proj.weight": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.q_proj.bias": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.q_proj.weight": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.v_proj.bias": "model-00002-of-00002.safetensors",
"image_to_text_projection.x_attn.v_proj.weight": "model-00002-of-00002.safetensors",
"text_model.model.embed_tokens.weight": "model-00001-of-00002.safetensors",
"text_model.model.layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.0.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.1.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.10.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.11.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.12.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.13.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.14.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.15.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.16.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.17.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.18.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.19.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.2.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.20.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.21.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.22.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.23.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.3.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.4.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.5.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.6.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.7.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.8.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.fc1.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.fc1.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.fc2.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.fc2.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.ffn_layernorm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.ffn.ffn_layernorm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.final_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.final_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
"text_model.model.layers.9.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
"text_model.model.segment_emb.weight": "model-00001-of-00002.safetensors",
"vision_model.embeddings.column_embedder.weight": "model-00001-of-00002.safetensors",
"vision_model.embeddings.patch_projection.bias": "model-00001-of-00002.safetensors",
"vision_model.embeddings.patch_projection.weight": "model-00001-of-00002.safetensors",
"vision_model.embeddings.row_embedder.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.0.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.1.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.10.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.11.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.12.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.13.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.14.attention.key.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.attention.output.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.attention.query.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.attention.value.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.mlp.wi_0.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.mlp.wi_1.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.mlp.wo.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.pre_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.14.pre_mlp_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.attention.key.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.attention.output.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.attention.query.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.attention.value.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.mlp.wi_0.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.mlp.wi_1.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.mlp.wo.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.pre_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.15.pre_mlp_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.attention.key.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.attention.output.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.attention.query.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.attention.value.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.mlp.wi_0.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.mlp.wi_1.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.mlp.wo.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.pre_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.16.pre_mlp_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.attention.key.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.attention.output.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.attention.query.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.attention.value.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.mlp.wi_0.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.mlp.wi_1.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.mlp.wo.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.pre_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.17.pre_mlp_layer_norm.weight": "model-00002-of-00002.safetensors",
"vision_model.encoder.layer.2.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.2.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.3.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.4.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.5.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.6.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.7.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.8.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.attention.key.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.attention.output.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.attention.query.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.attention.value.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.mlp.wi_0.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.mlp.wi_1.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.mlp.wo.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.pre_attention_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.encoder.layer.9.pre_mlp_layer_norm.weight": "model-00001-of-00002.safetensors",
"vision_model.layernorm.weight": "model-00002-of-00002.safetensors"
}
}