@@ -10,7 +10,7 @@ def reduce_model_config(config: Any) -> Dict[str, Any]:
1010 """Reduces a model size."""
1111 kwargs : Dict [str , Any ] = {}
1212 if hasattr (config , "num_hidden_layers" ):
13- config .num_hidden_layers = min (config .num_hidden_layers , 2 )
13+ config .num_hidden_layers = min (config .num_hidden_layers , 4 )
1414 if hasattr (config , "mm_tokens_per_image" ):
1515 config .mm_tokens_per_image = min (config .mm_tokens_per_image , 2 )
1616 if hasattr (config , "vision_config" ):
@@ -348,7 +348,7 @@ def random_input_kwargs(config: Any) -> Tuple[Dict[str, Any], Callable]:
348348 "vision_config" ,
349349 )
350350 text_config = False
351- check_hasattr (config .vision_config , ("num_channels" , "in_chans" ))
351+ check_hasattr (config .vision_config , ("num_channels" , "in_chans" , "in_channels" ))
352352 kwargs = dict (
353353 batch_size = 2 ,
354354 sequence_length = 43 ,
@@ -421,7 +421,9 @@ def random_input_kwargs(config: Any) -> Tuple[Dict[str, Any], Callable]:
421421 else config .vision_config .image_size
422422 ),
423423 num_channels = (
424- 3 if config is None else _pick (config .vision_config , "num_channels" , "in_chans" )
424+ 3
425+ if config is None
426+ else _pick (config .vision_config , "num_channels" , "in_chans" , "in_channels" )
425427 ),
426428 pad_token_id = (
427429 0
0 commit comments