forked from IDT-ITI/MMFusion-IML
-
Notifications
You must be signed in to change notification settings - Fork 0
/
inference.py
96 lines (72 loc) · 3.2 KB
/
inference.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
import argparse
import numpy as np
from torch.utils.data import DataLoader
import torch
import torchvision.transforms.functional as TF
import logging
import matplotlib.pyplot as plt
from data.datasets import ManipulationDataset
from model.cmnext_conf import CMNeXtWithConf
from model.modal_extract import ModalitiesExtractor
from configs.cmnext_init_cfg import _C as config, update_config
from model.ws_cmnext_conf import WSCMNeXtWithConf
parser = argparse.ArgumentParser(description='Infer')
parser.add_argument('-gpu', '--gpu', type=int, default=-1, help='device, use -1 for cpu')
parser.add_argument('-log', '--log', type=str, default='INFO', help='logging level')
parser.add_argument('-exp', '--exp', type=str, default='experiments/ec_example_phase_earlyfusion.yaml', help='Yaml experiment file')
parser.add_argument('-ckpt', '--ckpt', type=str, default='ckpt/early_fusion_detection.pth', help='Checkpoint')
parser.add_argument('-path', '--path', type=str, default='test/doc_manipsmall2.png', help='Image path')
parser.add_argument('opts', help="other options", default=None, nargs=argparse.REMAINDER)
args = parser.parse_args()
config = update_config(config, args.exp)
loglvl = getattr(logging, args.log.upper())
logging.basicConfig(level=loglvl)
gpu = args.gpu
device = 'cuda:%d' % gpu if gpu >= 0 else 'cpu'
np.set_printoptions(formatter={'float': '{: 7.3f}'.format})
if device != 'cpu':
# cudnn setting
import torch.backends.cudnn as cudnn
cudnn.benchmark = False
cudnn.deterministic = True
cudnn.enabled = config.CUDNN.ENABLED
modal_extractor = ModalitiesExtractor(config.MODEL.MODALS[1:], config.MODEL.NP_WEIGHTS)
if args.ckpt.endswith("early_fusion_detection.pth"):
model = CMNeXtWithConf(config.MODEL)
else:
model = WSCMNeXtWithConf(config.MODEL)
ckpt = torch.load(args.ckpt, map_location=device)
model.load_state_dict(ckpt['state_dict'])
modal_extractor.load_state_dict(ckpt['extractor_state_dict'])
modal_extractor.to(device)
model = model.to(device)
modal_extractor.eval()
model.eval()
target = "./results/" + "_mask.png"
with open('tmp_inf.txt', 'w') as f:
f.write(args.path + ' None 0\n')
val = ManipulationDataset('tmp_inf.txt',
config.DATASET.IMG_SIZE,
train=False)
val_loader = DataLoader(val,
batch_size=1,
shuffle=False,
num_workers=config.WORKERS,
pin_memory=True)
f1 = []
f1th = []
for step, (images, _, masks, lab) in enumerate(val_loader):
with torch.no_grad():
images = images.to(device, non_blocking=True)
masks = masks.squeeze(1).to(device, non_blocking=True)
modals = modal_extractor(images)
images_norm = TF.normalize(images, mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
inp = [images_norm] + modals
anomaly, confidence, detection = model(inp)
gt = masks.squeeze().cpu().numpy()
map = torch.nn.functional.softmax(anomaly, dim=1)[:, 1, :, :].squeeze().cpu().numpy()
det = detection.item()
plt.imsave(target, map, cmap='RdBu_r', vmin=0, vmax=1)
print(f"Ran on {args.path}")
print(f"Detection score: {det}")
print(f"Localization map saved in {target}")