-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathchange_semantic.py
67 lines (59 loc) · 2.7 KB
/
change_semantic.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
# To make the VLMs have some hallucinations on non-existing objects
import os
import torch
from surrogates import HuanranTransformerClipAttackVisionModel, HuanranOpenClipAttackVisionModel
from utils import save_image, get_image, get_list_image, save_list_images
from tqdm import tqdm
from attacks import MI_CommonWeakness, SSA_CommonWeakness
from utils.init import forbid_initialization
import argparse
from torchvision import transforms
parser = argparse.ArgumentParser()
parser.add_argument("--target_text", type=str, default=None)
parser.add_argument("--target_img_path", type=str, default=None)
parser.add_argument("--input_dir", type=str)
parser.add_argument("--output_dir", type=str)
args = parser.parse_args()
print(vars(args))
forbid_initialization()
assert args.target_text is not None or args.target_img_path is not None, "Must assign a target text or target image"
# The following codes aim to initialize the models.
# Don't care about this target text. Just for initialization of models.
target_text = args.target_text if args.target_text is not None else "A Bomb."
clip1 = HuanranTransformerClipAttackVisionModel("openai/clip-vit-large-patch14", target_text=target_text)
laion_clip = HuanranOpenClipAttackVisionModel("hf-hub:laion/CLIP-ViT-B-32-laion2B-s34B-b79K", target_text)
laion_clip2 = HuanranOpenClipAttackVisionModel("hf-hub:laion/CLIP-ViT-B-16-laion2B-s34B-b88K", target_text)
laion_clip3 = HuanranOpenClipAttackVisionModel(
"hf-hub:laion/CLIP-convnext_large_d_320.laion2B-s29B-b131K-ft-soup", target_text
)
laion_clip4 = HuanranOpenClipAttackVisionModel("hf-hub:laion/CLIP-ViT-bigG-14-laion2B-39B-b160k", target_text)
sig_clip = HuanranOpenClipAttackVisionModel("hf-hub:timm/ViT-SO400M-14-SigLIP-384", target_text, resolution=(384, 384))
models = [clip1, laion_clip, laion_clip4, sig_clip, laion_clip2, laion_clip3]
class LossPrinter:
def __init__(self):
self.count = 0
def __call__(self, loss, *args):
self.count += 1
if self.count % 100 == 1:
print(loss)
return loss
attacker = SSA_CommonWeakness(
models,
epsilon=16 / 255,
step_size=1 / 255,
total_step=50,
criterion=LossPrinter(),
)
if not os.path.exists(args.output_dir):
os.mkdir(args.output_dir)
images = get_list_image(args.input_dir)
transform = transforms.Resize((224, 224))
images = [transform(i).cuda() for i in images]
for i, image in enumerate(tqdm(images)):
for model in models:
if args.target_text is not None:
model.change_target_text(args.target_text)
else:
model.change_target_image(get_image(args.target_img_path).unsqueeze(0))
adv_x = attacker(image, torch.tensor([0]))
save_image(adv_x, os.path.join(args.output_dir, f"{i}.png"))