Skip to content

Commit be7d1a9

Browse files
kaln27 authored and Cyrilvallez committed
Fix errors when using verl to train the GLM4.1v model (#39199)
* Fix errors when using verl to train the GLM4.1v model
* Support loading glm4v from AutoModelForVision2Seq
* Set the glm4v model `_checkpoint_conversion_mapping` attribute from None to {}
* Update modeling_auto.py
1 parent 6023ca8 commit be7d1a9

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

src/transformers/models/glm4v/modeling_glm4v.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -940,7 +940,7 @@ def forward(
940940
@auto_docstring
941941
class Glm4vModel(Glm4vPreTrainedModel):
942942
base_model_prefix = ""
943-
_checkpoint_conversion_mapping = None
943+
_checkpoint_conversion_mapping = {}
944944
config_class = Glm4vConfig
945945
_no_split_modules = ["Glm4vTextDecoderLayer", "Glm4vVisionBlock"]
946946

@@ -1364,7 +1364,7 @@ class Glm4vCausalLMOutputWithPast(ModelOutput):
13641364

13651365

13661366
class Glm4vForConditionalGeneration(Glm4vPreTrainedModel, GenerationMixin):
1367-
_checkpoint_conversion_mapping = None
1367+
_checkpoint_conversion_mapping = {}
13681368
_tied_weights_keys = ["lm_head.weight"]
13691369

13701370
def __init__(self, config):

src/transformers/models/glm4v/modular_glm4v.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1049,7 +1049,7 @@ def forward(
10491049

10501050

10511051
class Glm4vModel(Qwen2_5_VLModel):
1052-
_checkpoint_conversion_mapping = None
1052+
_checkpoint_conversion_mapping = {}
10531053
_no_split_modules = ["Glm4vTextDecoderLayer", "Glm4vVisionBlock"]
10541054

10551055
def __init__(self, config):
@@ -1395,7 +1395,7 @@ class Glm4vCausalLMOutputWithPast(Qwen2_5_VLCausalLMOutputWithPast):
13951395

13961396

13971397
class Glm4vForConditionalGeneration(Qwen2_5_VLForConditionalGeneration):
1398-
_checkpoint_conversion_mapping = None
1398+
_checkpoint_conversion_mapping = {}
13991399

14001400
def forward(
14011401
self,

0 commit comments

Comments
 (0)