changebio
diff --git a/data/classifier/after_conv1_encoder.npy
1.32 MB b/data/classifier/after_conv1_encoder.npy
1.32 MB
diff --git a/data/classifier/after_conv2_encoder.npy
288 KB b/data/classifier/after_conv2_encoder.npy
288 KB
diff --git a/data/classifier/after_conv3_encoder.npy
32.1 KB b/data/classifier/after_conv3_encoder.npy
32.1 KB
diff --git a/data/classifier/after_conv4_encoder.npy
8.08 KB b/data/classifier/after_conv4_encoder.npy
8.08 KB
diff --git a/data/classifier/bn1_beta.npy
336 Bytes b/data/classifier/bn1_beta.npy
336 Bytes
diff --git a/data/classifier/bn1_gamma.npy
336 Bytes b/data/classifier/bn1_gamma.npy
336 Bytes
diff --git a/data/classifier/bn2_beta.npy
336 Bytes b/data/classifier/bn2_beta.npy
336 Bytes
diff --git a/data/classifier/bn2_gamma.npy
336 Bytes b/data/classifier/bn2_gamma.npy
336 Bytes
diff --git a/data/classifier/bn3_beta.npy
336 Bytes b/data/classifier/bn3_beta.npy
336 Bytes
diff --git a/data/classifier/bn3_gamma.npy
336 Bytes b/data/classifier/bn3_gamma.npy
336 Bytes
diff --git a/data/classifier/bn4_beta.npy
336 Bytes b/data/classifier/bn4_beta.npy
336 Bytes
diff --git a/data/classifier/bn4_gamma.npy
336 Bytes b/data/classifier/bn4_gamma.npy
336 Bytes
diff --git a/data/classifier/conv1_bias.npy
336 Bytes b/data/classifier/conv1_bias.npy
336 Bytes
diff --git a/data/classifier/conv1_encoder_conv2d.npy
5.28 MB b/data/classifier/conv1_encoder_conv2d.npy
5.28 MB
diff --git a/data/classifier/conv1_weigths.npy
2.33 KB b/data/classifier/conv1_weigths.npy
2.33 KB
diff --git a/data/classifier/conv2_bias.npy
336 Bytes b/data/classifier/conv2_bias.npy
336 Bytes
diff --git a/data/classifier/conv2_weigths.npy
144 KB b/data/classifier/conv2_weigths.npy
144 KB
diff --git a/data/classifier/conv3_bias.npy
336 Bytes b/data/classifier/conv3_bias.npy
336 Bytes
diff --git a/data/classifier/conv3_weigths.npy
144 KB b/data/classifier/conv3_weigths.npy
144 KB
diff --git a/data/classifier/conv4_bias.npy
336 Bytes b/data/classifier/conv4_bias.npy
336 Bytes
diff --git a/data/classifier/conv4_weigths.npy
64.1 KB b/data/classifier/conv4_weigths.npy
64.1 KB
diff --git a/data/classifier/image_input.npy
98.1 KB b/data/classifier/image_input.npy
98.1 KB
diff --git a/datasets/omniglotNShot.py
+3 b/datasets/omniglotNShot.py
+3
diff --git a/datasets/omniglotNShot.pyc
1.42 KB b/datasets/omniglotNShot.pyc
1.42 KB
diff --git a/main.py
+3-3 b/main.py
+3-3
diff --git a/models/Classifier.py
+64-19 b/models/Classifier.py
+64-19
@@ -41,6 +41,9 @@ def __init__(self, dataroot, batch_size = 100, classes_per_set=10, samples_per_c
             np.save(os.path.join(dataroot,'data.npy'),self.x)
         else:
             self.x = np.load(os.path.join(dataroot,'data.npy'))
+            # LOAD TENSORFLOW DATA IMPLEMENTATION
+            #self.x = np.load('/home/aberenguel/TensorFlow/MatchingNetworks/data.npy')
+            #self.x = np.reshape(self.x, [-1, 20, 28, 28, 1])
 
         """
         Constructs an N-Shot omniglot Dataset
 
@@ -15,19 +15,19 @@
 
 # Experiment Setup
 batch_size = 32
-fce = True
+fce = False
 classes_per_set = 20
 samples_per_class = 1
 channels = 1
 # Training setup
-total_epochs = 300
+total_epochs = 500
 total_train_batches = 1000
 total_val_batches = 100
 total_test_batches = 250
 # Parse other options
 args = Options().parse()
 
-LOG_DIR = args.log_dir + '/run-batchSize_{}-fce_{}-classes_per_set{}-samples_per_class{}-channels{}' \
+LOG_DIR = args.log_dir + '/3_run-batchSize_{}-fce_{}-classes_per_set{}-samples_per_class{}-channels{}' \
     .format(batch_size,fce,classes_per_set,samples_per_class,channels)
 
 # create logger
 
@@ -1,5 +1,6 @@
 import torch
 import torch.nn as nn
+import torch.nn.init as init
 from torch.autograd import Variable
 import unittest
 import numpy as np
@@ -11,11 +12,12 @@ def convLayer(in_planes, out_planes, stride=1, padding = 1, bias = True):
     return nn.Sequential(
         nn.Conv2d(in_planes, out_planes, kernel_size=3,
                   stride=stride, padding=padding, bias=bias),
+        #nn.LeakyReLU(0.2),
         nn.LeakyReLU(),
         nn.BatchNorm2d(out_planes),
-        # nn.MaxPool2d(kernel_size=2, stride=2,ceil_mode=True),
+        #nn.MaxPool2d(kernel_size=2, stride=2,ceil_mode=True),
         nn.MaxPool2d(kernel_size=2, stride=2),
-        nn.Dropout()
+        nn.Dropout(0.1)
     )
 
 
@@ -37,32 +39,47 @@ def __init__(self, layer_sizes, num_channels = 1, keep_prob = 0.5):
         self.layer3 = convLayer(layer_sizes[1], layer_sizes[2])
         self.layer4 = convLayer(layer_sizes[2], layer_sizes[3])
 
+
         self.weights_init(self.layer1)
         self.weights_init(self.layer2)
         self.weights_init(self.layer3)
         self.weights_init(self.layer4)
         '''
-        # Module initialization
-        for m in self.modules():
+        self.weights_init_tensorflow(self.layer1,1)
+        self.weights_init_tensorflow(self.layer2,2)
+        self.weights_init_tensorflow(self.layer3,3)
+        self.weights_init_tensorflow(self.layer4,4)
+        '''
+
+    def weights_init(self,module):
+        #for m in self.modules():
+        for m in module.modules():
             if isinstance(m, nn.Conv2d):
-                n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
-                m.weight.data.normal_(0, math.sqrt(2. / n))
+                init.xavier_uniform(m.weight, gain=np.sqrt(2))
+                init.constant(m.bias, 0)
+                ##m.weight.data.normal_(0.0, 0.02)
+                #n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
+                #m.weight.data.normal_(0, math.sqrt(2. / n))
             elif isinstance(m, nn.BatchNorm2d):
+                #m.weight.data.normal_(1.0, 0.02)
+                #m.bias.data.fill_(0)
                 m.weight.data.fill_(1)
                 m.bias.data.zero_()
-        '''
 
-    def weights_init(self,m):
-        for m in self.modules():
+    def weights_init_tensorflow(self,module,layer):
+        #for m in self.modules():
+        for m in module.modules():
             if isinstance(m, nn.Conv2d):
-                m.weight.data.normal_(0.0, 0.02)
-                #n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
-                #m.weight.data.normal_(0, math.sqrt(2. / n))
+                m.weight.data = torch.from_numpy(np.load('/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/conv' + str(layer) + '_weigths.npy').transpose((3,2,1,0)))
+                m.weight.data = m.weight.data.contiguous()
+                m.bias.data = torch.from_numpy(np.load('/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/conv' + str(layer) + '_bias.npy'))
             elif isinstance(m, nn.BatchNorm2d):
-                m.weight.data.normal_(1.0, 0.02)
-                m.bias.data.fill_(0)
-                #m.weight.data.fill_(1)
-                #m.bias.data.zero_()
+                m.weight.data = torch.from_numpy(np.load(
+                    '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/bn' + str(
+                        layer) + '_gamma.npy'))
+                m.bias.data = torch.from_numpy(np.load(
+                    '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/bn' + str(
+                        layer) + '_beta.npy'))
 
 
     def forward(self, image_input):
@@ -71,19 +88,20 @@ def forward(self, image_input):
         :param image_input: Image input to produce embeddings for. [batch_size, 28, 28, 1]
         :return: Embeddings of size [batch_size, 64]
         """
-        # TODO: What is better 2 padding at first conv2d or 1 padding in the last layer of conv2d??
-        #x = nn.Conv2d(1, 64, kernel_size=3, stride=1, bias=True).cuda()(image_input)
+
+        #x = nn.Conv2d(1, 64, kernel_size=3, stride=1, padding=0, bias=True).cuda()(image_input)
         #x = nn.LeakyReLU().cuda()(x)
         #x = nn.BatchNorm2d(64).cuda()(x)
         #x = nn.MaxPool2d(kernel_size=2, stride=2).cuda()(x)
         #x = nn.Dropout().cuda()(x)
 
+        #check = np.sum(self.layer1[0](image_input).data.cpu().numpy())
+
         x = self.layer1(image_input)
         x = self.layer2(x)
         x = self.layer3(x)
         x = self.layer4(x)
         x = torch.squeeze(x)
-        # TODO: flat output
         return x
 
 
@@ -94,11 +112,38 @@ def setUp(self):
         self.outputs = np.load('../data/gen_encode.npy')
         self.layer_sizes = [64,64,64,64]
 
+        self.after_conv1 = np.load(
+            '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/after_conv1_encoder.npy')
+        self.after_conv2 = np.load(
+            '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/after_conv2_encoder.npy')
+        self.after_conv3 = np.load(
+            '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/after_conv3_encoder.npy')
+        self.after_conv4 = np.load(
+            '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/after_conv4_encoder.npy')
+        self.image_input = np.load(
+            '/home/aberenguel/pytorch/examples/MatchingNetworks/data/classifier/image_input.npy')
+
     def tearDown(self):
         pass
 
     def test_forward(self):
         classifier = Classifier(layer_sizes=self.layer_sizes).cuda()
+
+        print("sum conv1 tf: %f" % np.sum(self.after_conv1))
+        print("sum conv2 tf: %f" % np.sum(self.after_conv2))
+        print("sum conv3 tf: %f" % np.sum(self.after_conv3))
+        print("sum conv4 tf: %f" % np.sum(self.after_conv4))
+        input = Variable(torch.from_numpy(self.image_input.transpose((0,3,1,2))).cuda(), requires_grad=True)
+
+        x1 = classifier.layer1(input)
+        print("sum conv1 pytorch: %f" % torch.sum(x1).data[0])
+        x2 = classifier.layer2(x1)
+        print("sum conv2 pytorch: %f" % torch.sum(x2).data[0])
+        x3 = classifier.layer3(x2)
+        print("sum conv2 pytorch: %f" % torch.sum(x3).data[0])
+        x4 = classifier.layer4(x3)
+        print("sum conv2 pytorch: %f" % torch.sum(x4).data[0])
+
         input = Variable(torch.from_numpy(self.inputs).cuda(), requires_grad=True)
         output = classifier(input)
         # TODO: why the output contains so many 0? The self.outputs d