diff --git a/surya/model/recognition/processor.py b/surya/model/recognition/processor.py index 5d42ac3a..28c4305a 100644 --- a/surya/model/recognition/processor.py +++ b/surya/model/recognition/processor.py @@ -194,8 +194,9 @@ def align_long_axis( class SuryaProcessor(DonutProcessor): def __init__(self, image_processor=None, tokenizer=None, train=False, **kwargs): - image_processor = SuryaImageProcessor.from_pretrained(settings.RECOGNITION_MODEL_CHECKPOINT) - tokenizer = Byt5LangTokenizer() + # Use the caller-supplied image_processor and tokenizer when provided; otherwise fall back to the defaults. + image_processor = image_processor or SuryaImageProcessor.from_pretrained(settings.RECOGNITION_MODEL_CHECKPOINT) + tokenizer = tokenizer or Byt5LangTokenizer() if image_processor is None: raise ValueError("You need to specify an `image_processor`.") if tokenizer is None: