@@ -84,13 +84,13 @@ def test_get_num_tokens_per_image(model_key, multimodal_model_configs):
8484 if model_type == 'llava_next' :
8585 input_processor = LlavaNextInputProcessor (
8686 model_path = encoder_model_dir ,
87- model_config = model_config_dict ,
87+ config = model_config_dict ,
8888 tokenizer = tokenizer ,
8989 trust_remote_code = True )
9090 elif model_type == 'qwen2_5_vl' :
9191 input_processor = Qwen2VLInputProcessorBase (
9292 model_path = encoder_model_dir ,
93- model_config = model_config_dict ,
93+ config = model_config_dict ,
9494 tokenizer = tokenizer ,
9595 trust_remote_code = True )
9696 else :
@@ -191,13 +191,13 @@ def test_get_num_tokens_per_video(model_key, multimodal_model_configs):
191191 if model_type == 'llava_next' :
192192 input_processor = LlavaNextInputProcessor (
193193 model_path = encoder_model_dir ,
194- model_config = model_config_dict ,
194+ config = model_config_dict ,
195195 tokenizer = tokenizer ,
196196 trust_remote_code = True )
197197 elif model_type == 'qwen2_5_vl' :
198198 input_processor = Qwen2VLInputProcessorBase (
199199 model_path = encoder_model_dir ,
200- model_config = model_config_dict ,
200+ config = model_config_dict ,
201201 tokenizer = tokenizer ,
202202 trust_remote_code = True )
203203 else :
0 commit comments