Added support for 5-shot

gitabcworld · gitabcworld · commit 0eb4d4b423ff · 2017-08-29T08:48:34.000+02:00
diff --git a/datasets/miniImagenetOneShot.py b/datasets/miniImagenetOneShot.py
@@ -32,7 +32,7 @@ def __init__(self, dataroot = '/home/aberenguel/Dataset/miniImagenet', type = 't
         self.classes_per_set = classes_per_set
         self.samples_per_class = samples_per_class
         self.n_samples = self.samples_per_class * self.classes_per_set
-        self.n_samplesNShot = 1 # Samples per meta-test. In this case 1 as is OneShot.
+        self.n_samplesNShot = 5 # Samples per meta-test. In this case 5 (5-shot).
         # Transformations to the image
         self.transform = transforms.Compose([filenameToPILImage,
                                              PiLImageResize,
diff --git a/datasets/omniglotNShot.py b/datasets/omniglotNShot.py
@@ -84,15 +84,15 @@ def normalization(self):
         self.max = np.max(self.x_train)
         self.min = np.min(self.x_train)
         print("train_shape", self.x_train.shape, "test_shape", self.x_test.shape, "val_shape", self.x_val.shape)
-        print("before_normalization", "mean", self.mean, "max", self.max, "min", self.min, "std", self.std)
+        #print("before_normalization", "mean", self.mean, "max", self.max, "min", self.min, "std", self.std)
         self.x_train = (self.x_train - self.mean) / self.std
         self.x_val = (self.x_val - self.mean) / self.std
         self.x_test = (self.x_test - self.mean) / self.std
-        self.mean = np.mean(self.x_train)
-        self.std = np.std(self.x_train)
-        self.max = np.max(self.x_train)
-        self.min = np.min(self.x_train)
-        print("after_normalization", "mean", self.mean, "max", self.max, "min", self.min, "std", self.std)
+        #self.mean = np.mean(self.x_train)
+        #self.std = np.std(self.x_train)
+        #self.max = np.max(self.x_train)
+        #self.min = np.min(self.x_train)
+        #print("after_normalization", "mean", self.mean, "max", self.max, "min", self.min, "std", self.std)
 
     def load_data_cache(self, data_pack):
         """
@@ -105,22 +105,34 @@ def load_data_cache(self, data_pack):
         for sample in range(1000):
             support_set_x = np.zeros((self.batch_size, n_samples, 28, 28, 1))
             support_set_y = np.zeros((self.batch_size, n_samples))
-            target_x = np.zeros((self.batch_size, 28, 28, 1), dtype=np.int)
-            target_y = np.zeros((self.batch_size,), dtype=np.int)
+            target_x = np.zeros((self.batch_size, self.samples_per_class, 28, 28, 1), dtype=int)  # NOTE(review): integer dtype truncates any float pixel values stored here - confirm
+            target_y = np.zeros((self.batch_size, self.samples_per_class), dtype=int)  # builtin int: the np.int alias was removed in NumPy 1.24
             for i in range(self.batch_size):
-                ind = 0
                 pinds = np.random.permutation(n_samples)
                 classes = np.random.choice(data_pack.shape[0], self.classes_per_set, False)
-                x_hat_class = np.random.randint(self.classes_per_set)
+                # select 1-shot or 5-shot classes for test with repetition
+                x_hat_class = np.random.choice(classes, self.samples_per_class, True)
+                pinds_test = np.random.permutation(self.samples_per_class)
+                ind = 0
+                ind_test = 0
                 for j, cur_class in enumerate(classes):  # each class
-                    example_inds = np.random.choice(data_pack.shape[1], self.samples_per_class, False)
-                    for eind in example_inds:
+                    if cur_class in x_hat_class:
+                        # Count number of times this class is inside the meta-test
+                        n_test_samples = np.sum(cur_class == x_hat_class)
+                        example_inds = np.random.choice(data_pack.shape[1], self.samples_per_class + n_test_samples, False)
+                    else:
+                        example_inds = np.random.choice(data_pack.shape[1], self.samples_per_class, False)
+
+                    # meta-training
+                    for eind in example_inds[:self.samples_per_class]:
                         support_set_x[i, pinds[ind], :, :, :] = data_pack[cur_class][eind]
                         support_set_y[i, pinds[ind]] = j
-                        ind += 1
-                    if j == x_hat_class:
-                        target_x[i, :, :, :] = data_pack[cur_class][np.random.choice(data_pack.shape[1])]
-                        target_y[i] = j
+                        ind = ind + 1
+                    # meta-test
+                    for eind in example_inds[self.samples_per_class:]:
+                        target_x[i, pinds_test[ind_test], :, :, :] = data_pack[cur_class][eind]
+                        target_y[i, pinds_test[ind_test]] = j
+                        ind_test = ind_test + 1
 
             data_cache.append([support_set_x, support_set_y, target_x, target_y])
         return data_cache
@@ -149,11 +161,11 @@ def get_batch(self,str_type, rotate_flag = False):
         if rotate_flag:
             k = int(np.random.uniform(low=0, high=4))
             # Iterate over the sequence. Extract batches.
-            for i in np.arange(x_support_set.shape[1]):
-                x_support_set[:,i,:,:,:] = self.__rotate_batch(x_support_set[:,i,:,:,:],k)
+            for i in np.arange(x_support_set.shape[0]):
+                x_support_set[i,:,:,:,:] = self.__rotate_batch(x_support_set[i,:,:,:,:],k)
             # Rotate all the batch of the target images
-            x_target = self.__rotate_batch(x_target,k)
-
+            for i in np.arange(x_target.shape[0]):
+                x_target[i,:,:,:,:] = self.__rotate_batch(x_target[i,:,:,:,:], k)
         return x_support_set, y_support_set, x_target, y_target
 
 
diff --git a/experiments/OneShotBuilder.py b/experiments/OneShotBuilder.py
@@ -90,7 +90,7 @@ def run_training_epoch(self, total_train_batches):
                 size = x_support_set.size()
                 x_support_set = x_support_set.view(size[0],size[1],size[4],size[2],size[3])
                 size = x_target.size()
-                x_target = x_target.view(size[0], size[3], size[1], size[2])
+                x_target = x_target.view(size[0],size[1],size[4],size[2],size[3])
                 if self.isCudaAvailable:
                     acc, c_loss_value = self.matchingNet(x_support_set.cuda(), y_support_set_one_hot.cuda(),
                                                          x_target.cuda(), y_target.cuda())
@@ -160,7 +160,7 @@ def run_validation_epoch(self, total_val_batches):
                 size = x_support_set.size()
                 x_support_set = x_support_set.view(size[0], size[1], size[4], size[2], size[3])
                 size = x_target.size()
-                x_target = x_target.view(size[0], size[3], size[1], size[2])
+                x_target = x_target.view(size[0],size[1],size[4],size[2],size[3])
                 if self.isCudaAvailable:
                     acc, c_loss_value = self.matchingNet(x_support_set.cuda(), y_support_set_one_hot.cuda(),
                                                          x_target.cuda(), y_target.cuda())
@@ -212,7 +212,7 @@ def run_testing_epoch(self, total_test_batches):
                 size = x_support_set.size()
                 x_support_set = x_support_set.view(size[0], size[1], size[4], size[2], size[3])
                 size = x_target.size()
-                x_target = x_target.view(size[0], size[3], size[1], size[2])
+                x_target = x_target.view(size[0],size[1],size[4],size[2],size[3])
                 if self.isCudaAvailable:
                     acc, c_loss_value = self.matchingNet(x_support_set.cuda(), y_support_set_one_hot.cuda(),
                                                          x_target.cuda(), y_target.cuda())
diff --git a/models/MatchingNetwork.py b/models/MatchingNetwork.py
@@ -62,30 +62,38 @@ def forward(self, support_set_images, support_set_labels_one_hot, target_image,
         # produce embeddings for support set images
         encoded_images = []
         for i in np.arange(support_set_images.size(1)):
-            gen_encode = self.g(support_set_images[:,i,:,:])
+            gen_encode = self.g(support_set_images[:,i,:,:,:])
             encoded_images.append(gen_encode)
 
         # produce embeddings for target images
-        gen_encode = self.g(target_image)
-        encoded_images.append(gen_encode)
-        outputs = torch.stack(encoded_images)
+        for i in np.arange(target_image.size(1)):
+            gen_encode = self.g(target_image[:,i,:,:,:])
+            encoded_images.append(gen_encode)
+            outputs = torch.stack(encoded_images)
+
+            if self.fce:
+                outputs, hn, cn = self.lstm(outputs)
 
-        if self.fce:
-            outputs, hn, cn = self.lstm(outputs)
+            # get similarity between support set embeddings and target
+            similarities = self.dn(support_set=outputs[:-1], input_image=outputs[-1])
+            similarities = similarities.t()
 
-        # get similarity between support set embeddings and target
-        similarities = self.dn(support_set=outputs[:-1], input_image=outputs[-1])
-        similarities = similarities.t()
+            # produce predictions for target probabilities
+            preds = self.classify(similarities,support_set_y=support_set_labels_one_hot)
 
-        # produce predictions for target probabilities
-        preds = self.classify(similarities,support_set_y=support_set_labels_one_hot)
+            # accumulate per-target accuracy and crossentropy loss (both are averaged over the targets at return)
+            values, indices = preds.max(1)
+            if i == 0:
+                accuracy = torch.mean((indices.squeeze() == target_label[:,i]).float())
+                crossentropy_loss = F.cross_entropy(preds, target_label[:,i].long())
+            else:
+                accuracy = accuracy + torch.mean((indices.squeeze() == target_label[:, i]).float())
+                crossentropy_loss = crossentropy_loss + F.cross_entropy(preds, target_label[:, i].long())
 
-        # calculate accuracy and crossentropy loss
-        values, indices = preds.max(1)
-        accuracy = torch.mean((indices.squeeze() == target_label).float())
-        crossentropy_loss = F.cross_entropy(preds, target_label.long())
+            # delete the last target image encoding of encoded_images
+            encoded_images.pop()
 
-        return accuracy, crossentropy_loss
+        return accuracy/target_image.size(1), crossentropy_loss/target_image.size(1)
 
 
 class MatchingNetworkTest(unittest.TestCase):