|
23 | 23 | import re |
24 | 24 | from typing import Any, Callable, Dict, List, Optional, Tuple, Union |
25 | 25 |
|
| 26 | +import cv2 |
26 | 27 | import numpy as np |
27 | 28 | import PIL.Image |
28 | 29 | import torch |
29 | 30 | import torch.nn.functional as F |
30 | 31 | from bert_tokenizer import BasicTokenizer |
31 | | -from text_embedding_module import TextEmbeddingModule |
| 32 | +from embedding_manager import EmbeddingManager |
| 33 | +from frozen_clip_embedder_t3 import FrozenCLIPEmbedderT3 |
| 34 | +from PIL import Image, ImageDraw, ImageFont |
| 35 | +from recognizer import TextRecognizer, create_predictor |
| 36 | +from safetensors.torch import load_file |
| 37 | +from torch import nn |
32 | 38 | from transformers import CLIPImageProcessor, CLIPTextModel, CLIPTokenizer, CLIPVisionModelWithProjection |
33 | 39 |
|
34 | 40 | from diffusers.callbacks import MultiPipelineCallbacks, PipelineCallback |
|
100 | 106 | """ |
101 | 107 |
|
102 | 108 |
|
103 | | -import cv2 |
104 | | -import numpy as np |
105 | | -import torch |
106 | | -from embedding_manager import EmbeddingManager |
107 | | -from frozen_clip_embedder_t3 import FrozenCLIPEmbedderT3 |
108 | | -from PIL import Image, ImageDraw, ImageFont |
109 | | -from recognizer import TextRecognizer, create_predictor |
110 | | -from torch import nn |
111 | | - |
112 | | -from diffusers.utils import ( |
113 | | - logging, |
114 | | -) |
115 | | - |
116 | | - |
117 | | -logger = logging.get_logger(__name__) # pylint: disable=invalid-name |
118 | | - |
119 | | - |
120 | 109 | class TextEmbeddingModule(nn.Module): |
121 | 110 | def __init__(self, font_path, use_fp16=False, device="cpu"): |
122 | 111 | super().__init__() |
@@ -403,21 +392,6 @@ def to(self, *args, **kwargs): |
403 | 392 | return self |
404 | 393 |
|
405 | 394 |
|
406 | | -from typing import Optional |
407 | | - |
408 | | -import cv2 |
409 | | -import numpy as np |
410 | | -import torch |
411 | | -from PIL import ImageFont |
412 | | -from safetensors.torch import load_file |
413 | | -from torch import nn |
414 | | - |
415 | | -from diffusers.utils import logging |
416 | | - |
417 | | - |
418 | | -logger = logging.get_logger(__name__) # pylint: disable=invalid-name |
419 | | - |
420 | | - |
421 | 395 | # Copied from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion_img2img.retrieve_latents |
422 | 396 | def retrieve_latents( |
423 | 397 | encoder_output: torch.Tensor, generator: Optional[torch.Generator] = None, sample_mode: str = "sample" |
@@ -589,7 +563,6 @@ def to(self, device): |
589 | 563 | return self |
590 | 564 |
|
591 | 565 |
|
592 | | - |
593 | 566 | # Copied from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.retrieve_timesteps |
594 | 567 | def retrieve_timesteps( |
595 | 568 | scheduler, |
|
0 commit comments