-
Notifications
You must be signed in to change notification settings - Fork 75
Expand file tree
/
Copy pathoptimize_image.py
More file actions
76 lines (56 loc) · 2.65 KB
/
optimize_image.py
File metadata and controls
76 lines (56 loc) · 2.65 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
import os
import tqdm
import torch
import omegaconf
import torchvision
import numpy as np
from PIL import Image
from wmforger.models import build_extractor
transform_image = torchvision.transforms.Compose([
lambda x: x.convert("RGB"),
torchvision.transforms.Resize((768, 768)),
torchvision.transforms.ToTensor(),
lambda x: x.view(1, 3, 768, 768),
])
def get_artifact_discriminator(ckpt_path, device="cuda:0"):
model_type = "convnext_tiny"
state_dict = torch.load(ckpt_path, weights_only=True, map_location="cpu")["model"]
extractor_params = omegaconf.OmegaConf.load("configs/extractor.yaml")[model_type]
model = build_extractor(model_type, extractor_params, img_size=256, nbits=0)
model.load_state_dict(state_dict)
model = model.eval().to(device)
return model
def optimize(img: Image, model, device="cuda:0", num_steps=50, lr=0.05):
img = transform_image(img).to(device)
param = torch.nn.Parameter(torch.zeros_like(img)).to(device)
optim = torch.optim.SGD([param], lr=lr)
for _ in tqdm.tqdm(range(num_steps)):
optim.zero_grad()
loss = -model((img + param).clip(0, 1)).mean()
loss.backward()
optim.step()
return (img + param).clip(0, 1).detach().cpu()
def get_watermark(img: Image, optimized_img: torch.Tensor):
optimized_img = optimized_img.mul(255).round().to(torch.uint8).permute(0, 2, 3, 1).squeeze(0).numpy()
optimized_img = Image.fromarray(optimized_img).resize(img.size, Image.BILINEAR)
watermark = np.array(img).astype(np.float32) - np.array(optimized_img).astype(np.float32)
return optimized_img, watermark
if __name__ == "__main__":
import argparse
parser = argparse.ArgumentParser()
parser.add_argument("--image", type=str, help="Path to the image file", required=True)
parser.add_argument("--ckpt_path", type=str, help="Path to the checkpoint file", required=True)
args = parser.parse_args()
device = "cuda"
model = get_artifact_discriminator(ckpt_path=args.ckpt_path, device=device)
image = Image.open(args.image).convert("RGB")
optimized_img = optimize(image, model, device=device, num_steps=50, lr=0.05)
cleaned_image, watermark = get_watermark(image, optimized_img)
os.makedirs("output", exist_ok=True)
Image.fromarray(np.round(np.abs(watermark * 16)).astype(np.uint8)).save("output/watermark.png")
cleaned_image.save("output/cleaned_image.png")
print("Extracted watermark saved to output/watermark.png")