Commit 4147c4d ("update read me")
Author: wbw520
Parent: b8c43dc
14 files changed: +310 -61 lines

README.md (+5 -5)
````diff
@@ -20,19 +20,19 @@ Using the following command for training
 ```
 python main_recon.py --num_classes 10 --num_cpt 20 --lr 0.001 --epoch 50 --lr_drop 30
 ```
-Use the following command for the inference of a sample. You can change the index to select different input samples. Change deactivate (deactivate one concept, 1 to num_class) and see the changes of reconstruction. Change top-sample (top-10 in the paper) to show more details for a concept. Visualization for the input sample and all concepts are shown at folder "vis" and "vis_pp", respectively.
+Use the following command for the inference of a sample. You can change the index to select different input samples. Change top-sample (top-10 in the paper) to show more details for a concept. Visualization for the input sample and all concepts are shown at folder "vis" and "vis_pp", respectively.
 ```
-python vis_recon.py --num_classes 10 --num_cpt 20 --index 0 --top_sample 10 ---deactivate -1
+python vis_recon.py --num_classes 10 --num_cpt 20 --index 0 --top_sample 20 ---deactivate -1
 ```
 
 #### Usage for CUB200, ImageNet, Synthetic (matplot) and Custom
 We first pre-train the backbone and then train the whole model. For ImageNet, Synthetic (matplot) and Custom, just change the name for dataset.
 ```
 Pre-training of backbone:
-python main_retri.py --num_classes 50 --num_cpt 20 --base_model resnet18 --lr 0.0005 --epoch 60 --lr_drop 40 --pre_train True --dataset CUB200 --dataset_dir "your dir"
+python main_contrast.py --num_classes 50 --num_cpt 20 --base_model resnet18 --lr 0.0005 --epoch 60 --lr_drop 40 --pre_train True --dataset CUB200 --dataset_dir "your dir"
 
 Training for BotCL:
-python main_retri.py --num_classes 50 --num_cpt 20 --base_model resnet18 --lr 0.0005 --epoch 60 --lr_drop 40 --dataset CUB200 --dataset_dir "your dir" --weak_supervision_bias 0.1 --quantity_bias 0.1 --distinctiveness_bias 0.01 --consistence_bias 0.05
+python main_contrast.py --num_classes 50 --num_cpt 20 --base_model resnet18 --lr 0.0005 --epoch 60 --lr_drop 40 --dataset CUB200 --dataset_dir "your dir" --weak_supervision_bias 0.1 --quantity_bias 0.1 --distinctiveness_bias 0.05 --consistence_bias 0.01
 ```
 
 Use the following commend to visualize the learned concept.
@@ -42,5 +42,5 @@ First run process.py to extarct the activation for all dataset samples:
 python process.py
 
 Then see the generated concepts by:
-python vis_retri.py --num_classes 50 --num_cpt 20 --base_model resnet18 --index 300 --top_sample 10 --dataset CUB200
+python vis_contrast.py --num_classes 50 --num_cpt 20 --base_model resnet18 --index 300 --top_sample 20 --dataset CUB200
 ```
````
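For orientation, the four `*_bias` flags in the BotCL command above weight auxiliary loss terms. A schematic of how such weights typically combine into the total objective, purely as an assumption for readability (the repo's exact loss composition is not shown in this commit):

```python
# Schematic only: hypothetical weighted sum of BotCL's loss terms,
# using the flag names from the command above.
def total_loss(cls_loss, quantity, distinctiveness, consistence, args):
    return (cls_loss
            + args.quantity_bias * quantity
            + args.distinctiveness_bias * distinctiveness
            + args.consistence_bias * consistence)
```

Under this reading, the README change shifts weight from the consistence term (0.05 to 0.01) to the distinctiveness term (0.01 to 0.05).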

configs.py (+9 -9)
```diff
@@ -2,8 +2,8 @@
 
 import argparse
 parser = argparse.ArgumentParser(description="PyTorch implementation of cpt")
-parser.add_argument('--dataset', type=str, default="ImageNet")
-parser.add_argument('--dataset_dir', type=str, default="/home/wangbowen/DATA")
+parser.add_argument('--dataset', type=str, default="imagenet")
+parser.add_argument('--dataset_dir', type=str, default="/data/li")
 parser.add_argument('--output_dir', type=str, default="saved_model")
 # ========================= Model Configs ==========================
 parser.add_argument('--num_classes', default=50, type=int, help='category for classification')
@@ -20,24 +20,24 @@
 parser.add_argument('--layer', default=1, help='layers for fc, default as one')
 # ========================= Training Configs ==========================
 parser.add_argument('--weak_supervision_bias', type=float, default=0.1, help='weight fot the weak supervision branch')
-parser.add_argument('--att_bias', type=float, default=0.5, help='used to prevent overflow, default as 0.1')
+parser.add_argument('--att_bias', type=float, default=0.1, help='used to prevent overflow, default as 0.1')
 parser.add_argument('--quantity_bias', type=float, default=0.1, help='force each concept to be binary')
-parser.add_argument('--distinctiveness_bias', type=float, default=0.1, help='refer to paper')
+parser.add_argument('--distinctiveness_bias', type=float, default=0.01, help='refer to paper')
 parser.add_argument('--consistence_bias', type=float, default=0.05, help='refer to paper')
 # ========================= Learning Configs ==========================
 parser.add_argument('--start_epoch', default=0, type=int, metavar='N', help='start epoch')
-parser.add_argument('--lr', default=0.0001, type=float)
+parser.add_argument('--lr', default=0.0005, type=float)
 parser.add_argument('--batch_size', default=256, type=int)
-parser.add_argument('--epoch', default=200, type=int)
-parser.add_argument('--lr_drop', default=160, type=float, nargs="+",
+parser.add_argument('--epoch', default=40, type=int)
+parser.add_argument('--lr_drop', default=30, type=float, nargs="+",
                     metavar='LRSteps', help='epochs to decay learning rate by 10')
 # ========================= Machine Configs ==========================
 parser.add_argument('--num_workers', default=4, type=int)
-parser.add_argument('--device', default='cuda:2', help='device to use for training / testing')
+parser.add_argument('--device', default='cuda:0', help='device to use for training / testing')
 # ========================= Demo Configs ==========================
 parser.add_argument('--index', default=0, type=int)
 parser.add_argument('--use_weight', default=False, help='whether use fc weight for the generation of attention mask')
-parser.add_argument('--top_samples', default=50, type=int, help='top n activated samples')
+parser.add_argument('--top_samples', default=20, type=int, help='top n activated samples')
 # parser.add_argument('--demo_cls', default="n01498041", type=str)
 parser.add_argument('--fre', default=1, type=int, help='frequent of show results during training')
 parser.add_argument('--deactivate', default=-1, type=int, help='the index of concept to be deativated')
```
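A quick way to sanity-check the new defaults without launching training; a minimal sketch, assuming `configs.py` is importable from the repo root:

```python
# Parse an empty argv so only the defaults apply.
from configs import parser

args = parser.parse_args([])
assert args.dataset == "imagenet"   # was "ImageNet"
assert args.lr == 0.0005            # was 0.0001
assert args.epoch == 40             # was 200
assert args.top_samples == 20       # was 50
print(args.device)                  # "cuda:0" (was "cuda:2")
```

One argparse subtlety worth knowing: with `nargs="+"`, a scalar default such as `30` is returned as-is (not wrapped in a list) when `--lr_drop` is omitted, so downstream code has to accept both a scalar and a list.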

loaders/get_loader.py (+3 -3)
```diff
@@ -62,7 +62,7 @@ def get_transform(args):
         transform = transforms.Compose([transforms.Resize([args.img_size, args.img_size]), transforms.ToTensor(),
                                         transforms.Normalize([0.5071, 0.4867, 0.4408], [0.2675, 0.2565, 0.2761])])
         return {"train": transform, "val": transform}
-    elif args.dataset == "CUB200" or args.dataset == "ImageNet":
+    elif args.dataset == "CUB200" or args.dataset == "ImageNet" or args.dataset == "imagenet":
         transform_train = get_train_transformations(args, [[0.485, 0.456, 0.406], [0.229, 0.224, 0.225]])
         transform_val = get_val_transformations(args, [[0.485, 0.456, 0.406], [0.229, 0.224, 0.225]])
         return {"train": transform_train, "val": transform_val}
@@ -91,7 +91,7 @@ def select_dataset(args, transform):
         dataset_train = CUB_200(args, train=True, transform=transform["train"])
         dataset_val = CUB_200(args, train=False, transform=transform["val"])
         return dataset_train, dataset_val
-    elif args.dataset == "ImageNet":
+    elif args.dataset == "ImageNet" or args.dataset == "imagenet":
         dataset_train = ImageNet(args, "train", transform=transform["train"])
         dataset_val = ImageNet(args, "val", transform=transform["val"])
         return dataset_train, dataset_val
@@ -154,7 +154,7 @@ def filter(data):
         val_imgs = datasets.CIFAR10('./data/cifar10', train=False, download=True, transform=None).data
         val_labels = datasets.CIFAR10('./data/cifar10', train=False, download=True, transform=None).targets
         return train_imgs, train_labels, val_imgs, val_labels, cat
-    elif args.dataset == "ImageNet" or args.dataset == "Custom":
+    elif args.dataset == "ImageNet" or args.dataset == "imagenet" or args.dataset == "Custom":
         train = ImageNet(args, "train", transform=None).train
         val = ImageNet(args, "train", transform=None).val
         cat = ImageNet(args, "train", transform=None).category
```
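This change adds `"imagenet"` as an accepted spelling alongside `"ImageNet"` in three separate branches. A case-insensitive check would cover both spellings in one place; the sketch below is a hedged alternative design, not the repo's code:

```python
def is_dataset(name: str, *aliases: str) -> bool:
    # Case-insensitive dataset-name match, e.g. "ImageNet" == "imagenet".
    return name.lower() in {a.lower() for a in aliases}

assert is_dataset("imagenet", "ImageNet")
assert is_dataset("ImageNet", "ImageNet")
assert not is_dataset("CUB200", "ImageNet")
```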

main_retri.py → main_contrast.py (renamed, +1 -1)
```diff
@@ -60,7 +60,7 @@ def main():
             print("get better result, save current model.")
             torch.save(model.state_dict(), os.path.join(args.output_dir,
                        f"{args.dataset}_{args.base_model}_cls{args.num_classes}_" + f"cpt{args.num_cpt if not args.pre_train else ''}_" +
-                       f"{'use_slot_' + args.cpt_activation if not args.pre_train else 'no_slot'}.pt"))
+                       f"{'use_slot_' + args.cpt_activation if not args.pre_train else 'no_slot'}3.pt"))
 
 
 if __name__ == '__main__':
```
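The `3` appended before `.pt` changes every checkpoint filename this script writes. Purely as an illustration (the values below are hypothetical, not taken from the repo), the f-string now produces names like:

```python
dataset, base_model, num_classes = "CUB200", "resnet18", 50
num_cpt, pre_train, cpt_activation = 20, False, "att"  # hypothetical values

name = (f"{dataset}_{base_model}_cls{num_classes}_"
        + f"cpt{num_cpt if not pre_train else ''}_"
        + f"{'use_slot_' + cpt_activation if not pre_train else 'no_slot'}3.pt")
print(name)  # CUB200_resnet18_cls50_cpt20_use_slot_att3.pt
```

Note that the loaders in ACE.py and kmeans.py below appear to still look for `..._cpt_no_slot.pt` without the `3` suffix.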

ACE.py → model/ACE.py (moved, +2 -2)
```diff
@@ -12,7 +12,7 @@
 import shutil
 # from draws.draw_synthetic import draw_syn
 import torch
-from quantitative_eval import make_statistic
+from utils.quantitative_eval import make_statistic
 import json
 from model.retrieval.model_main import MainModel
 
@@ -268,7 +268,7 @@ def cal_ace(self):
     args.device = "cuda:1"
     device = torch.device(args.device)
     model_.to(device)
-    args.output_dir = "saved_model"
+    args.output_dir = "../saved_model"
     checkpoint = torch.load(os.path.join(args.output_dir,
                             f"{args.dataset}_{args.base_model}_cls{args.num_classes}_cpt_no_slot.pt"), map_location=device)
     model_.load_state_dict(checkpoint, strict=True)
```
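Since ACE.py moved into `model/`, the relative `"../saved_model"` only resolves correctly when the script is launched from inside `model/`. A common way to make such paths independent of the launch directory (an assumption, not what the repo does) is to anchor them to the file's own location:

```python
import os

# Hypothetical helper: resolve saved_model/ relative to this file
# rather than the current working directory.
OUTPUT_DIR = os.path.normpath(
    os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "saved_model"))
```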

kmeans.py → model/kmeans.py (moved, +2 -3)
```diff
@@ -8,9 +8,8 @@
 import torch
 import json
 from sklearn.manifold import TSNE
-from quantitative_eval import make_statistic
+from utils.quantitative_eval import make_statistic
 from loaders.ImageNet import get_name
-import sklearn.metrics.pairwise as metrics
 from sklearn.decomposition import PCA
 from model.retrieval.model_main import MainModel
 import cv2
@@ -210,7 +209,7 @@ def draw(data, labels):
     args.device = "cuda:2"
     device = torch.device(args.device)
     model_.to(device)
-    args.output_dir = "saved_model"
+    args.output_dir = "../saved_model"
     checkpoint = torch.load(os.path.join(args.output_dir,
                             f"{args.dataset}_{args.base_model}_cls{args.num_classes}_cpt_no_slot.pt"),
                             map_location=device)
```

model/protopnet.py (new file, +243 lines)
```python
import torch
import torch.nn as nn
import torch.utils.model_zoo as model_zoo
import torch.nn.functional as F


class PPNet(nn.Module):

    def __init__(self, features, img_size, prototype_shape,
                 num_classes, init_weights=True,
                 prototype_activation_function='log',
                 add_on_layers_type='bottleneck'):

        super(PPNet, self).__init__()
        self.img_size = img_size
        self.prototype_shape = prototype_shape
        self.num_prototypes = prototype_shape[0]
        self.num_classes = num_classes
        self.epsilon = 1e-4

        # prototype_activation_function could be 'log', 'linear',
        # or a generic function that converts distance to similarity score
        self.prototype_activation_function = prototype_activation_function

        '''
        Here we are initializing the class identities of the prototypes
        Without domain specific knowledge we allocate the same number of
        prototypes for each class
        '''
        assert (self.num_prototypes % self.num_classes == 0)
        # a onehot indication matrix for each prototype's class identity
        self.prototype_class_identity = torch.zeros(self.num_prototypes,
                                                    self.num_classes)

        num_prototypes_per_class = self.num_prototypes // self.num_classes
        for j in range(self.num_prototypes):
            self.prototype_class_identity[j, j // num_prototypes_per_class] = 1

        # this has to be named features to allow the precise loading
        self.features = features

        if add_on_layers_type == 'bottleneck':
            add_on_layers = []
            current_in_channels = 512
            while (current_in_channels > self.prototype_shape[1]) or (len(add_on_layers) == 0):
                current_out_channels = max(self.prototype_shape[1], (current_in_channels // 2))
                add_on_layers.append(nn.Conv2d(in_channels=current_in_channels,
                                               out_channels=current_out_channels,
                                               kernel_size=1))
                add_on_layers.append(nn.ReLU())
                add_on_layers.append(nn.Conv2d(in_channels=current_out_channels,
                                               out_channels=current_out_channels,
                                               kernel_size=1))
                if current_out_channels > self.prototype_shape[1]:
                    add_on_layers.append(nn.ReLU())
                else:
                    assert (current_out_channels == self.prototype_shape[1])
                    add_on_layers.append(nn.Sigmoid())
                current_in_channels = current_in_channels // 2
            self.add_on_layers = nn.Sequential(*add_on_layers)
        else:
            self.add_on_layers = nn.Sequential(
                nn.Conv2d(in_channels=512, out_channels=self.prototype_shape[1],
                          kernel_size=1),
                nn.ReLU(),
                nn.Conv2d(in_channels=self.prototype_shape[1], out_channels=self.prototype_shape[1], kernel_size=1),
                nn.Sigmoid()
            )

        self.prototype_vectors = nn.Parameter(torch.rand(self.prototype_shape),
                                              requires_grad=True)

        # do not make this just a tensor,
        # since it will not be moved automatically to gpu
        self.ones = nn.Parameter(torch.ones(self.prototype_shape),
                                 requires_grad=False)

        self.last_layer = nn.Linear(self.num_prototypes, self.num_classes,
                                    bias=False)  # do not use bias

        if init_weights:
            self._initialize_weights()

    def conv_features(self, x):
        '''
        the feature input to prototype layer
        '''
        x = self.features(x)
        x = self.add_on_layers(x)
        return x

    @staticmethod
    def _weighted_l2_convolution(input, filter, weights):
        '''
        input of shape N * c * h * w
        filter of shape P * c * h1 * w1
        weight of shape P * c * h1 * w1
        '''
        input2 = input ** 2
        input_patch_weighted_norm2 = F.conv2d(input=input2, weight=weights)

        filter2 = filter ** 2
        weighted_filter2 = filter2 * weights
        filter_weighted_norm2 = torch.sum(weighted_filter2, dim=(1, 2, 3))
        filter_weighted_norm2_reshape = filter_weighted_norm2.view(-1, 1, 1)

        weighted_filter = filter * weights
        weighted_inner_product = F.conv2d(input=input, weight=weighted_filter)

        # use broadcast
        intermediate_result = \
            - 2 * weighted_inner_product + filter_weighted_norm2_reshape
        # x2_patch_sum and intermediate_result are of the same shape
        distances = F.relu(input_patch_weighted_norm2 + intermediate_result)

        return distances

    def _l2_convolution(self, x):
        '''
        apply self.prototype_vectors as l2-convolution filters on input x
        '''
        x2 = x ** 2
        x2_patch_sum = F.conv2d(input=x2, weight=self.ones)

        p2 = self.prototype_vectors ** 2
        p2 = torch.sum(p2, dim=(1, 2, 3))
        # p2 is a vector of shape (num_prototypes,)
        # then we reshape it to (num_prototypes, 1, 1)
        p2_reshape = p2.view(-1, 1, 1)

        xp = F.conv2d(input=x, weight=self.prototype_vectors)
        intermediate_result = - 2 * xp + p2_reshape  # use broadcast
        # x2_patch_sum and intermediate_result are of the same shape
        distances = F.relu(x2_patch_sum + intermediate_result)

        return distances

    def prototype_distances(self, x):
        '''
        x is the raw input
        '''
        conv_features = self.conv_features(x)
        distances = self._l2_convolution(conv_features)
        return distances

    def distance_2_similarity(self, distances):
        if self.prototype_activation_function == 'log':
            return torch.log((distances + 1) / (distances + self.epsilon))
        elif self.prototype_activation_function == 'linear':
            return -distances
        else:
            return self.prototype_activation_function(distances)

    def forward(self, x):
        distances = self.prototype_distances(x)
        '''
        we cannot refactor the lines below for similarity scores
        because we need to return min_distances
        '''
        # global min pooling
        min_distances = -F.max_pool2d(-distances,
                                      kernel_size=(distances.size()[2],
                                                   distances.size()[3]))
        min_distances = min_distances.view(-1, self.num_prototypes)
        prototype_activations = self.distance_2_similarity(min_distances)
        logits = self.last_layer(prototype_activations)
        return logits, min_distances

    def push_forward(self, x):
        '''this method is needed for the pushing operation'''
        conv_output = self.conv_features(x)
        distances = self._l2_convolution(conv_output)
        return conv_output, distances

    def prune_prototypes(self, prototypes_to_prune):
        '''
        prototypes_to_prune: a list of indices each in
        [0, current number of prototypes - 1] that indicates the prototypes to
        be removed
        '''
        prototypes_to_keep = list(set(range(self.num_prototypes)) - set(prototypes_to_prune))

        self.prototype_vectors = nn.Parameter(self.prototype_vectors.data[prototypes_to_keep, ...],
                                              requires_grad=True)

        self.prototype_shape = list(self.prototype_vectors.size())
        self.num_prototypes = self.prototype_shape[0]

        # changing self.last_layer in place
        # changing in_features and out_features make sure the numbers are consistent
        self.last_layer.in_features = self.num_prototypes
        self.last_layer.out_features = self.num_classes
        self.last_layer.weight.data = self.last_layer.weight.data[:, prototypes_to_keep]

        # self.ones is nn.Parameter
        self.ones = nn.Parameter(self.ones.data[prototypes_to_keep, ...],
                                 requires_grad=False)
        # self.prototype_class_identity is torch tensor
        # so it does not need .data access for value update
        self.prototype_class_identity = self.prototype_class_identity[prototypes_to_keep, :]

    def set_last_layer_incorrect_connection(self, incorrect_strength):
        '''
        the incorrect strength will be actual strength if -0.5 then input -0.5
        '''
        positive_one_weights_locations = torch.t(self.prototype_class_identity)
        negative_one_weights_locations = 1 - positive_one_weights_locations

        correct_class_connection = 1
        incorrect_class_connection = incorrect_strength
        self.last_layer.weight.data.copy_(
            correct_class_connection * positive_one_weights_locations
            + incorrect_class_connection * negative_one_weights_locations)

    def _initialize_weights(self):
        for m in self.add_on_layers.modules():
            if isinstance(m, nn.Conv2d):
                # every init technique has an underscore _ in the name
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')

                if m.bias is not None:
                    nn.init.constant_(m.bias, 0)

            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)

        self.set_last_layer_incorrect_connection(incorrect_strength=-0.5)


def construct_PPNet(bone, img_size=224,
                    prototype_shape=(1500, 512, 1, 1), num_classes=15,
                    prototype_activation_function='log',
                    add_on_layers_type='bottleneck'):
    features = bone

    return PPNet(features=features,
                 img_size=img_size,
                 prototype_shape=prototype_shape,
                 num_classes=num_classes,
                 init_weights=True,
                 prototype_activation_function=prototype_activation_function,
                 add_on_layers_type=add_on_layers_type)
```
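`_l2_convolution` computes the squared L2 distance between every spatial patch x and every prototype p through the expansion ||x - p||^2 = ||x||^2 - 2<x, p> + ||p||^2, realizing each term with `F.conv2d`. Below is a minimal usage sketch for the new module (our assumption; the commit does not show how protopnet.py is wired in). `construct_PPNet` expects a backbone that emits 512 channels, e.g. a torchvision ResNet-18 with its pooling and fc head removed:

```python
import torch
import torch.nn as nn
import torchvision.models as models

from model.protopnet import construct_PPNet  # assumes the repo root is on sys.path

# ResNet-18 without avgpool/fc: output is (N, 512, 7, 7) for 224x224 input.
backbone = nn.Sequential(*list(models.resnet18(weights=None).children())[:-2])

# 1500 prototypes of shape (512, 1, 1) split evenly over 15 classes
# (1500 % 15 == 0, satisfying the assert in PPNet.__init__).
ppnet = construct_PPNet(backbone, img_size=224,
                        prototype_shape=(1500, 512, 1, 1), num_classes=15)

x = torch.randn(2, 3, 224, 224)            # dummy batch
logits, min_distances = ppnet(x)           # forward returns both
print(logits.shape, min_distances.shape)   # torch.Size([2, 15]) torch.Size([2, 1500])
```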
