@@ -977,15 +977,12 @@ class TensorNameMap:
977
977
"visual.blocks.{bid}.norm2" , # qwen2vl
978
978
),
979
979
980
- # some namings are messed up because the original llava code swapped fc1 and fc2
981
- # we have no better way to fix it, just be careful
982
- # new models like pixtral use the correct naming
983
980
MODEL_TENSOR .V_ENC_FFN_UP : (
984
981
"vision_tower.vision_model.encoder.layers.{bid}.mlp.fc1" ,
985
982
"vpm.encoder.layers.{bid}.mlp.fc1" ,
986
- "model.vision_model.encoder.layers.{bid}.mlp.fc2" , # SmolVLM, gemma3 (note: name is swapped)
983
+ "model.vision_model.encoder.layers.{bid}.mlp.fc1" , # SmolVLM, gemma3
987
984
"vision_tower.transformer.layers.{bid}.feed_forward.up_proj" , # pixtral
988
- "visual.blocks.{bid}.mlp.fc2" , # qwen2vl
985
+ "visual.blocks.{bid}.mlp.fc1" , # qwen2vl
989
986
"visual.blocks.{bid}.mlp.up_proj" , # qwen2.5vl
990
987
),
991
988
@@ -997,9 +994,9 @@ class TensorNameMap:
997
994
MODEL_TENSOR .V_ENC_FFN_DOWN : (
998
995
"vision_tower.vision_model.encoder.layers.{bid}.mlp.fc2" ,
999
996
"vpm.encoder.layers.{bid}.mlp.fc2" ,
1000
- "model.vision_model.encoder.layers.{bid}.mlp.fc1" , # SmolVLM, gemma3 (note: name is swapped)
997
+ "model.vision_model.encoder.layers.{bid}.mlp.fc2" , # SmolVLM, gemma3
1001
998
"vision_tower.transformer.layers.{bid}.feed_forward.down_proj" , # pixtral
1002
- "visual.blocks.{bid}.mlp.fc1" , # qwen2vl
999
+ "visual.blocks.{bid}.mlp.fc2" , # qwen2vl
1003
1000
"visual.blocks.{bid}.mlp.down_proj" , # qwen2.5vl
1004
1001
),
1005
1002
0 commit comments