wbw520
diff --git a/‎configs.py
Lines changed: 8 additions & 6 deletions b/‎configs.py
Lines changed: 8 additions & 6 deletions
diff --git a/‎cpt_compare.py
Lines changed: 119 additions & 0 deletions b/‎cpt_compare.py
Lines changed: 119 additions & 0 deletions
diff --git a/‎draw_graph/ablation.py
Lines changed: 177 additions & 0 deletions b/‎draw_graph/ablation.py
Lines changed: 177 additions & 0 deletions
@@ -4,16 +4,18 @@
 
 import argparse
 parser = argparse.ArgumentParser(description="PyTorch implementation of cpt")
-parser.add_argument('--dataset', type=str, default="CUB200")
+parser.add_argument('--dataset', type=str, default="ImageNet")
 parser.add_argument('--dataset_dir', type=str, default="/media/wbw/a7f02863-b441-49d0-b546-6ef6fefbbc7e")
 parser.add_argument('--output_dir', type=str, default="saved_model")
 # ========================= Model Configs ==========================
-parser.add_argument('--num_classes', default=50, help='category for classification')
-parser.add_argument('--num_cpt', default=50, help='number of the concept')
+# NOTE(review): neither option below declares type=, so a value given on the
+# command line is stored as str while the default is an int.
+parser.add_argument('--num_classes', default=20, help='category for classification')
+parser.add_argument('--num_cpt', default=10, help='number of the concept')
 parser.add_argument('--base_model', default="resnet18", type=str)
 parser.add_argument('--img_size', default=224, help='size for input image')
 parser.add_argument('--pre_train', default=False, type=bool,
                     help='whether pre-train the model')
+# NOTE(review): type=bool makes argparse call bool() on the raw string, so any
+# non-empty value (including "False") is parsed as True.
+parser.add_argument('--aug', default=True, type=bool,
+                    help='whether use augmentation')
 parser.add_argument('--act_type', default="sigmoid", help='the activation for the slot attention')
 parser.add_argument('--num_retrieval', default=50, help='number of the top retrieval images')
 parser.add_argument('--weight_att', default=False, help='using fc weight for att visualization')
@@ -24,10 +26,10 @@
 
 # ========================= Learning Configs ==========================
 parser.add_argument('--start_epoch', default=0, type=int, metavar='N', help='start epoch')
-parser.add_argument('--lr', default=0.0005, type=float)
+parser.add_argument('--lr', default=0.0001, type=float)
 parser.add_argument('--batch_size', default=128, type=int)
-parser.add_argument('--epoch', default=40, type=int)
-parser.add_argument('--lr_drop', default=20, type=float, nargs="+",
+parser.add_argument('--epoch', default=80, type=int)
+# NOTE(review): with nargs="+" a command-line value becomes a list of floats,
+# whereas the default stays a bare int; consumers see two different shapes.
+parser.add_argument('--lr_drop', default=60, type=float, nargs="+",
                     metavar='LRSteps', help='epochs to decay learning rate by 10')
 # ========================= Machine Configs ==========================
 parser.add_argument('--num_workers', default=4, type=int)
 
@@ -0,0 +1,119 @@
+from torchvision import datasets, transforms
+from model.model_main import MainModel
+from configs import parser
+import torch
+import os
+from PIL import Image
+import numpy as np
+from utils import apply_colormap_on_image
+from loaders.get_loader import load_all_imgs, get_transform
+from tools import for_retrival, attention_estimation
+import h5py
+from draw_tools import draw_bar, draw_plot
+import shutil
+import torch.nn.functional as F
+from tools import crop_center, shot_game
+import cv2
+import copy
+from captum.metrics import infidelity
+
+
+# Start every run from empty visualisation folders: drop both, then recreate both.
+for _vis_dir in ('vis/', 'vis_pp/'):
+    shutil.rmtree(_vis_dir, ignore_errors=True)
+for _vis_dir in ('vis/', 'vis_pp/'):
+    os.makedirs(_vis_dir, exist_ok=True)
+# Print small floats in fixed-point notation instead of scientific notation.
+np.set_printoptions(suppress=True)
+
+
+def main():
+    """Score the saved model's attention maps on the validation images.
+
+    For every validation image that the model classifies correctly, two
+    values are collected:
+
+    * the first result of ``shot_game`` for the mask read from
+      ``vis/overall.png`` (stored in ``record``), and
+    * the mean of the min-max normalised probability curve obtained while
+      progressively masking the input (stored in ``record_Dauc``).
+
+    The mean of each list is printed at the end.  The function reads the
+    module-level ``args`` namespace created under the ``__main__`` guard and
+    requires a CUDA device ("cuda:0").
+    """
+    # load all imgs (the database split is not needed here)
+    _, _, imgs_val, labels_val, cat = load_all_imgs(args)
+    print("All category:")
+    print(cat)
+    transform = get_transform(args)["val"]
+
+    # load model and weights
+    model = MainModel(args, vis=True)
+    device = torch.device("cuda:0")
+    model.to(device)
+    name = f"{args.dataset}_{args.base_model}_cls{args.num_classes}_cpt{args.num_cpt}_" + f"{'use_slot_' + args.act_type + '_' + args.cpt_activation if not args.pre_train else 'no_slot'}.pt"
+    print(name)
+    checkpoint = torch.load(os.path.join(args.output_dir, name), map_location="cuda:0")
+    model.load_state_dict(checkpoint, strict=True)
+    model.eval()
+    # The weights are fixed from here on, so look the classifier matrix up once
+    # instead of rebuilding the whole state dict for every image.
+    cls_weight = model.state_dict()["cls.weight"]
+    record = []
+    record_Dauc = []
+
+    for i, (data, label) in enumerate(zip(imgs_val, labels_val)):
+        print(i)
+        model.vis = True
+        print(data)
+
+        # convert('RGB') already expands grayscale input to three channels;
+        # the context manager releases the file handle right after decoding.
+        with Image.open(data) as raw_img:
+            image_orl = raw_img.convert('RGB').resize([256, 256], resample=Image.BILINEAR)
+        image_orl = crop_center(image_orl, 224, 224)
+        imggg = transform(image_orl).unsqueeze(0).to(device)
+        # Non-negative part of the classifier row that belongs to the true label.
+        w2 = torch.relu(cls_weight[label])
+        _, pred, _, _ = model(imggg, w2)
+
+        pred = F.softmax(pred, dim=-1)
+        pred_label = torch.argmax(pred).item()
+        if pred_label != label:
+            print("predict error")
+            continue
+
+        # NOTE(review): presumably this file is written by the forward pass
+        # above while model.vis is True -- confirm in MainModel.
+        mask = cv2.imread("vis/" + f'overall.png', cv2.IMREAD_UNCHANGED) / 255
+        hitted, _ = shot_game(mask, data)
+        if hitted is None:
+            continue
+        record.append(hitted)
+
+        # Probability of the predicted class: first the unmasked image, then
+        # 100 increasingly masked versions.
+        record_p = [pred[0][pred_label].item()]
+        mask1 = mask.flatten()
+        ids = np.argsort(-mask1, axis=0)  # pixel indices, strongest response first
+        model.vis = False
+        for j in range(1, 101):
+            # Value of the (j * 501)-th strongest pixel.
+            # NOTE(review): assumes the mask has at least 50101 entries -- confirm.
+            thresh = mask1[ids[j * 501]]
+            mask_use = mask.copy()
+            # Blank everything at or above the threshold; whatever is still
+            # non-zero is kept.  Pixels that were exactly 0 in the mask stay 0,
+            # so they are blanked as well.
+            mask_use[mask_use >= thresh] = 0
+            mask_use[mask_use != 0] = 1
+
+            mask_use = torch.from_numpy(mask_use).to(device, torch.float32)
+            new_img = imggg * mask_use
+            _, masked_pred, _, _ = model(new_img, None, None)
+            output_c = F.softmax(masked_pred, dim=-1)
+            record_p.append(output_c[0][pred_label].item())
+        record_p = np.array(record_p)
+        lowest = np.min(record_p)
+        span = np.max(record_p) - lowest
+        if span == 0:
+            # A flat curve cannot be min-max normalised; dividing by zero would
+            # put NaN into record_Dauc and turn the final mean into NaN.
+            print("flat probability curve, skipped")
+            continue
+        record_p = (record_p - lowest) / span
+        print(record_p.mean())
+        record_Dauc.append(record_p.mean())
+
+    print(np.mean(np.array(record)))
+    print(record)
+    print(np.mean(np.array(record_Dauc)))
+
+if __name__ == '__main__':
+    # Parse the options declared on the parser imported from configs;
+    # main() reads the resulting module-level `args`.
+    args = parser.parse_args()
+    # Force pre_train off regardless of the command line or the default.
+    args.pre_train = False
+    main()
@@ -0,0 +1,177 @@
+import matplotlib.pyplot as plt
+import numpy as np
+
+
+# Draws a 2 x 5 grid of line plots (top row labelled MNIST, bottom row labelled
+# CUB200), three series per panel, and writes the figure to ablation.pdf.
+plt.figure(figsize=(36, 10), dpi=80)
+plt.rcParams['font.family'] = 'serif'
+plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']
+plt.rcParams['axes.linewidth'] = 3
+
+# Subplot positions 1-5 form the top row, 6-10 the bottom row.
+axes = [plt.subplot(2, 5, position) for position in range(1, 11)]
+
+linewidth = 5
+font = 30
+size_1 = 10
+
+# One marker/colour pair per series, in the order acc, inter, exter.
+markers = ['o', 's', '^']
+colors = ['#edb03d', "#4dbeeb", "#77ac41"]
+
+# Every panel has five equally spaced x positions; only the tick labels differ.
+index = [0, 1, 2, 3, 4]
+x_cpt_mnist = ["5", "10", "20", "50", "100"]
+x_cpt_bird = ["20", "50", "100", "200", "300"]
+x_1 = [0, 0.1, 1, 2, 5]
+x_2 = [0, 0.1, 1, 5, 10]
+x_3 = [0, 0.1, 1, 5, 10]
+x_4 = [0, 0.1, 1, 2, 5]
+
+# One entry per panel in subplot order: (x tick labels, acc, inter, exter).
+panels = [
+    # ---- top row ----
+    (x_cpt_mnist,
+     [0.857, 0.922, 0.962, 0.995, 0.992],
+     [0.732, 0.791, 0.930, 0.965, 0.988],
+     [0.531, 0.513, 0.618, 0.906, 0.960]),
+    (x_1,
+     [0.940, 0.962, 0.922, 0.886, 0.780],
+     [0.921, 0.930, 0.930, 0.938, 0.889],
+     [0.731, 0.723, 0.718, 0.736, 0.849]),
+    (x_2,
+     [0.960, 0.956, 0.962, 0.955, 0.963],
+     [0.930, 0.926, 0.930, 0.945, 0.970],
+     [0.711, 0.710, 0.718, 0.715, 0.789]),
+    (x_3,
+     [0.957, 0.967, 0.962, 0.948, 0.900],
+     [0.931, 0.935, 0.930, 0.938, 0.949],
+     [0.719, 0.713, 0.718, 0.716, 0.700]),
+    (x_4,
+     [0.927, 0.949, 0.962, 0.948, 0.952],
+     [0.981, 0.935, 0.930, 0.948, 0.949],
+     [0.979, 0.923, 0.718, 0.746, 0.750]),
+    # ---- bottom row ----
+    (x_cpt_bird,
+     [0.566, 0.668, 0.675, 0.680, 0.676],
+     [0.702, 0.850, 0.930, 0.961, 0.965],
+     [0.631, 0.353, 0.245, 0.248, 0.361]),
+    (x_1,
+     [0.650, 0.668, 0.642, 0.588, 0.128],
+     [0.752, 0.850, 0.880, 0.810, 0.402],
+     [0.601, 0.353, 0.332, 0.371, 0.853]),
+    (x_2,
+     [0.704, 0.685, 0.668, 0.662, 0.634],
+     [0.652, 0.812, 0.850, 0.921, 0.960],
+     [0.381, 0.373, 0.345, 0.398, 0.401]),
+    (x_3,
+     [0.620, 0.656, 0.668, 0.660, 0.652],
+     [0.812, 0.823, 0.850, 0.881, 0.880],
+     [0.671, 0.583, 0.345, 0.298, 0.291]),
+    (x_4,
+     [0.670, 0.656, 0.668, 0.660, 0.652],
+     [0.782, 0.799, 0.890, 0.891, 0.900],
+     [0.361, 0.343, 0.265, 0.268, 0.261]),
+]
+
+# Axis captions keyed by 1-based subplot position.  Only the first panel of
+# each row has a y label and only the bottom row has x labels.  Raw strings
+# keep the LaTeX backslashes literal ("\l" is not a valid escape sequence).
+y_labels = {1: "MNIST", 6: "CUB200"}
+x_labels = {
+    6: ("k", font + size_1 + 5),
+    7: (r"$\lambda_{qua}$", font + size_1),
+    8: (r"$\lambda_{con}$", font + size_1),
+    9: (r"$\lambda_{dis}$", font + size_1),
+    10: (r"$\lambda_R$", font + size_1),
+}
+
+for position, (ax, (tick_labels, acc, inter, exter)) in enumerate(zip(axes, panels), start=1):
+    ax.set_xticks(index)
+    ax.set_xticklabels(tick_labels)
+
+    # All panels share the fixed y range [0, 1]; only the first panel of each
+    # row shows y ticks (at 0 and 1), the others have none.
+    ax.axis(ymin=0, ymax=1)
+    if position in y_labels:
+        ax.set_yticks(np.linspace(0, 1, 2, endpoint=True))
+    else:
+        ax.set_yticks([])
+    ax.tick_params(labelsize=font+5)
+
+    if position in y_labels:
+        ax.set_ylabel(y_labels[position], fontsize=font+size_1)
+    if position in x_labels:
+        caption, caption_size = x_labels[position]
+        ax.set_xlabel(caption, fontsize=caption_size)
+
+    for series, marker, color in zip((acc, inter, exter), markers, colors):
+        ax.plot(index, series, marker=marker, markevery=1, markersize=15, color=color, linewidth=linewidth, linestyle="-")
+
+
+plt.tight_layout()
+plt.savefig("ablation.pdf")
+plt.show()