From 2199039ba822a48932a8b79ffbd9cd9c47c0e784 Mon Sep 17 00:00:00 2001
From: Jia Guo <guojia@gmail.com>
Date: Wed, 29 Nov 2017 17:04:05 +0800
Subject: [PATCH] refine

---
 src/common/face_image.py      |   2 +-
 src/common/face_preprocess.py |  31 +-
 src/data.py                   | 577 +++++++++++++++++++++++++++-------
 src/{ => eval}/lfw.py         |  89 +++++-
 src/marginalnet.py            |  29 +-
 src/train_softmax.py          | 157 ++-------
 6 files changed, 611 insertions(+), 274 deletions(-)
 rename src/{ => eval}/lfw.py (71%)

diff --git a/src/common/face_image.py b/src/common/face_image.py
index 035d13a..e169d50 100644
--- a/src/common/face_image.py
+++ b/src/common/face_image.py
@@ -114,7 +114,7 @@ def get_dataset_common(input_dir):
   return ret
 
 def get_dataset(name, input_dir):
-  if name=='webface' or name=='lfw':
+  if name=='webface' or name=='lfw' or name=='vgg':
     return get_dataset_common(input_dir)
   if name=='celeb':
     return get_dataset_celeb(input_dir)
diff --git a/src/common/face_preprocess.py b/src/common/face_preprocess.py
index 5271877..1c9525b 100644
--- a/src/common/face_preprocess.py
+++ b/src/common/face_preprocess.py
@@ -49,13 +49,25 @@ def preprocess(img, bbox=None, landmark=None, **kwargs):
   if isinstance(img, str):
     img = read_image(img, **kwargs)
   M = None
+  image_size = []  # stays empty when no 'image_size' kwarg is supplied
+  str_image_size = kwargs.get('image_size', '')
+  if len(str_image_size)>0:
+    image_size = [int(x) for x in str_image_size.split(',')]
+    if len(image_size)==1:
+      image_size = [image_size[0], image_size[0]]  # a single number is used for both entries
+    assert len(image_size)==2
+    assert image_size[0]==112
+    assert image_size[1]==112 or image_size[1]==96  # was re-testing [0]; [1] picks the 112 vs 96 template
   if landmark is not None:
+    assert len(image_size)==2
     src = np.array([
       [30.2946, 51.6963],
       [65.5318, 51.5014],
       [48.0252, 71.7366],
       [33.5493, 92.3655],
       [62.7299, 92.2041] ], dtype=np.float32 )
+    if image_size[1]==112:
+      src[:,0] += 8.0
     dst = landmark.astype(np.float32)
 
     tform = trans.SimilarityTransform()
@@ -78,16 +90,12 @@ def preprocess(img, bbox=None, landmark=None, **kwargs):
     bb[1] = np.maximum(det[1]-margin/2, 0)
     bb[2] = np.minimum(det[2]+margin/2, img.shape[1])
     bb[3] = np.minimum(det[3]+margin/2, img.shape[0])
-    cropped = img[bb[1]:bb[3],bb[0]:bb[2],:]
-    str_image_size = kwargs.get('image_size', '')
-    if len(str_image_size)>0:
-      image_size = [int(x) for x in str_image_size.split(',')]
-      if len(image_size)==1:
-        image_size = [image_size[0], image_size[0]]
-      assert len(image_size)==2
-    scaled = cv2.resize(cropped, (image_size[1], image_size[0]))
-    return scaled
+    ret = img[bb[1]:bb[3],bb[0]:bb[2],:]
+    if len(image_size)>0:
+      ret = cv2.resize(ret, (image_size[1], image_size[0]))
+    return ret 
   else: #do align using landmark
+    assert len(image_size)==2
 
     #src = src[0:3,:]
     #dst = dst[0:3,:]
@@ -96,11 +104,8 @@ def preprocess(img, bbox=None, landmark=None, **kwargs):
     #print(src.shape, dst.shape)
     #print(src)
     #print(dst)
-    _shape = [int(x) for x in kwargs.get('image_size').split(',')]
-    #print(_shape)
-    #M = cv2.getAffineTransform(src,dst)
     #print(M)
-    warped = cv2.warpAffine(img,M,(_shape[1],_shape[0]), borderValue = 0.0)
+    warped = cv2.warpAffine(img,M,(image_size[1],image_size[0]), borderValue = 0.0)
 
     #tform3 = trans.ProjectiveTransform()
     #tform3.estimate(src, dst)
diff --git a/src/data.py b/src/data.py
index 0e64edd..469e3c4 100644
--- a/src/data.py
+++ b/src/data.py
@@ -27,118 +27,140 @@ import face_preprocess
 
 logger = logging.getLogger()
 
-#modification on ImageIter
 class FaceImageIter(io.DataIter):
 
-    def __init__(self, batch_size, data_shape, images_per_person, margin = 44, path_imglist=None, path_root=None,
-                 shuffle=False, aug_list=None,
+    def __init__(self, batch_size, data_shape,
+                 path_imgrec = None,
+                 shuffle=False, aug_list=None, mean = None,
+                 rand_mirror = False,
                  data_name='data', label_name='softmax_label', **kwargs):
         super(FaceImageIter, self).__init__()
-        assert path_imglist
-        self.label2key = {}
-        self.labelkeys = []
-        print('loading image list...')
-        with open(path_imglist) as fin:
-            imglist = {}
-            imgkeys = []
-            key = 0
-            for line in iter(fin.readline, ''):
-                line = line.strip().split('\t')
-                if len(line)<17:
-                  continue #skip no detected face image
-                label = nd.array([float(line[2])])
-                ilabel = int(line[2])
-                if ilabel not in self.label2key:
-                  self.label2key[ilabel] = [key]
-                  self.labelkeys.append(ilabel)
-                  #self.labelcur[ilabel] = 0
-                else:
-                  self.label2key[ilabel].append(key)
-                #label = nd.array([float(i) for i in line[1:-1]])
-                bbox = np.array([int(i) for i in line[3:7]])
-                #key = int(line[0])
-                imglist[key] = (label, line[1], bbox)
-                imgkeys.append(key)
-                key+=1
-            self.imglist = imglist
-        print('image list size', len(self.imglist))
+        assert path_imgrec
+        if path_imgrec:
+            logging.info('loading recordio %s...',
+                         path_imgrec)
+            path_imgidx = path_imgrec[0:-4]+".idx"
+            self.imgrec = recordio.MXIndexedRecordIO(path_imgidx, path_imgrec, 'r')  # pylint: disable=redefined-variable-type
+            s = self.imgrec.read_idx(0)
+            header, _ = recordio.unpack(s)
+            if header.flag>0:
+              print('header0 label', header.label)
+              #assert(header.flag==1)
+              self.imgidx = range(1, int(header.label[0]))
+              self.idx2range = {}
+              self.seq_identity = range(int(header.label[0]), int(header.label[1]))
+              for identity in self.seq_identity:
+                s = self.imgrec.read_idx(identity)
+                header, _ = recordio.unpack(s)
+                #print('flag', header.flag)
+                #print(header.label)
+                #assert(header.flag==2)
+                self.idx2range[identity] = (int(header.label[0]), int(header.label[1]))
+              print('idx2range', len(self.idx2range))
+            else:
+              self.imgidx = list(self.imgrec.keys)
+            if shuffle:
+              self.seq = self.imgidx
+            else:
+              self.seq = None
 
-        self.path_root = path_root
-        self.margin = margin
+        self.mean = mean
+        self.nd_mean = None
+        if self.mean:
+          self.mean = np.array(self.mean, dtype=np.float32).reshape(1,1,3)
+          self.nd_mean = mx.nd.array(self.mean).reshape((1,1,3))
 
         self.check_data_shape(data_shape)
         self.provide_data = [(data_name, (batch_size,) + data_shape)]
         self.provide_label = [(label_name, (batch_size,))]
         self.batch_size = batch_size
         self.data_shape = data_shape
-        self.images_per_person = images_per_person
-        #self.label_width = label_width
-        self.imgkeys = imgkeys
         self.shuffle = shuffle
+        self.image_size = '%d,%d'%(data_shape[1],data_shape[2])
+        self.rand_mirror = rand_mirror
+        #self.cast_aug = mx.image.CastAug()
+        #self.color_aug = mx.image.ColorJitterAug(0.4, 0.4, 0.4)
 
-        if aug_list is None:
-            self.auglist = mx.image.CreateAugmenter(data_shape, **kwargs)
-        else:
-            self.auglist = aug_list
-        print('aug size:', len(self.auglist))
-        #for aug in self.auglist:
-        #  print(aug.__name__)
         self.cur = 0
-        self.labelcur = 0
         self.reset()
 
     def reset(self):
         """Resets the iterator to the beginning of the data."""
+        print('call reset()')
         if self.shuffle:
-            #random.shuffle(self.imgkeys)
-            random.shuffle(self.labelkeys)
+            random.shuffle(self.seq)
+        if self.imgrec is not None:
+            self.imgrec.reset()
         self.cur = 0
-        self.labelcur = 0
-        #for k in self.label2key:
-        #  random.shuffle(self.label2key[k])
 
-    def _next_sample(self):
-        """Helper function for reading in next sample."""
-        #set total batch size, for example, 1800, and maximum size for each people, for example 45
-        while True:
-          if self.cur >= len(self.labelkeys):
-            raise StopIteration
-          ilabel = self.labelkeys[self.cur]
-          if self.labelcur>=min(len(self.label2key[ilabel]), self.images_per_person):
-            self.labelcur=0
-            self.cur+=1
-          else:
-            idx = self.label2key[ilabel][self.labelcur]
-            self.labelcur += 1
-            label, fname, bbox = self.imglist[idx]
-            return label, self.read_image(fname), bbox
+    def num_samples(self):  # self.seq is None when shuffle is off, so fall back to the index list
+      return len(self.imgidx if self.seq is None else self.seq)
 
     def next_sample(self):
         """Helper function for reading in next sample."""
         #set total batch size, for example, 1800, and maximum size for each people, for example 45
-        while True:
-          if self.cur >= len(self.labelkeys):
-            raise StopIteration
-          ilabel = self.labelkeys[self.cur]
-          if self.labelcur>=min(len(self.label2key[ilabel]), self.images_per_person):
-            self.labelcur=0
-            self.cur+=1
+        if self.seq is not None:
+          if self.cur >= len(self.seq):
+              raise StopIteration
+          idx = self.seq[self.cur]
+          self.cur += 1
+          if self.imgrec is not None:
+            s = self.imgrec.read_idx(idx)
+            header, img = recordio.unpack(s)
+            return header.label, img, None, None
           else:
-            #print('in next_sample', self.cur, self.labelcur)
-            if self.labelcur==0 and self.shuffle:
-              #print('shuffling')
-              random.shuffle(self.label2key[ilabel])
-            idx = self.label2key[ilabel][self.labelcur]
-            self.labelcur += 1
-            label, fname, bbox = self.imglist[idx]
-            return label, self.read_image(fname), bbox
+            label, fname, bbox, landmark = self.imglist[idx]
+            return label, self.read_image(fname), bbox, landmark
+        else:
+            s = self.imgrec.read()
+            if s is None:
+                raise StopIteration
+            header, img = recordio.unpack(s)
+            return header.label, img, None, None
+
+    def brightness_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      src *= alpha
+      return src
+
+    def contrast_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      coef = np.array([[[0.299, 0.587, 0.114]]])
+      gray = src * coef
+      gray = (3.0 * (1.0 - alpha) / gray.size) * np.sum(gray)
+      src *= alpha
+      src += gray
+      return src
+
+    def saturation_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      coef = np.array([[[0.299, 0.587, 0.114]]])
+      gray = src * coef
+      gray = np.sum(gray, axis=2, keepdims=True)
+      gray *= (1.0 - alpha)
+      src *= alpha
+      src += gray
+      return src
+
+    def color_aug(self, img, x):
+      augs = [self.brightness_aug, self.contrast_aug, self.saturation_aug]
+      random.shuffle(augs)
+      for aug in augs:
+        #print(img.shape)
+        img = aug(img, x)
+        #print(img.shape)
+      return img
+
+    def mirror_aug(self, img):
+      _rd = random.randint(0,1)
+      if _rd==1:
+        for c in xrange(img.shape[2]):
+          img[:,:,c] = np.fliplr(img[:,:,c])
+      return img
+
 
     def next(self):
         """Returns the next batch of data."""
-        if self.shuffle:
-            random.shuffle(self.labelkeys)
-            self.cur = 0
-            self.labelcur = 0
         #print('in next', self.cur, self.labelcur)
         batch_size = self.batch_size
         c, h, w = self.data_shape
@@ -147,23 +169,48 @@ class FaceImageIter(io.DataIter):
         i = 0
         try:
             while i < batch_size:
-                label, s, bbox = self.next_sample()
-                data = [self.imdecode(s, bbox)]
+                label, s, bbox, landmark = self.next_sample()
+                _data = self.imdecode(s)
+                if self.rand_mirror:
+                  _rd = random.randint(0,1)
+                  if _rd==1:
+                    _data = mx.ndarray.flip(data=_data, axis=1)
+                if self.nd_mean is not None:
+                    _data = _data.astype('float32')
+                    _data -= self.nd_mean
+                    _data *= 0.0078125
+                #_npdata = _data.asnumpy()
+                #if landmark is not None:
+                #  _npdata = face_preprocess.preprocess(_npdata, bbox = bbox, landmark=landmark, image_size=self.image_size)
+                #if self.rand_mirror:
+                #  _npdata = self.mirror_aug(_npdata)
+                #if self.mean is not None:
+                #  _npdata = _npdata.astype(np.float32)
+                #  _npdata -= self.mean
+                #  _npdata *= 0.0078125
+                #nimg = np.zeros(_npdata.shape, dtype=np.float32)
+                #nimg[self.patch[1]:self.patch[3],self.patch[0]:self.patch[2],:] = _npdata[self.patch[1]:self.patch[3], self.patch[0]:self.patch[2], :]
+                #_data = mx.nd.array(nimg)
+                data = [_data]
                 try:
                     self.check_valid_image(data)
                 except RuntimeError as e:
                     logging.debug('Invalid image, skipping:  %s', str(e))
                     continue
-                data = self.augmentation_transform(data)
+                #print('aa',data[0].shape)
+                #data = self.augmentation_transform(data)
+                #print('bb',data[0].shape)
                 for datum in data:
                     assert i < batch_size, 'Batch size must be multiples of augmenter output length'
+                    #print(datum.shape)
                     batch_data[i][:] = self.postprocess_data(datum)
                     batch_label[i][:] = label
                     i += 1
         except StopIteration:
-            if not i:
+            if i<batch_size:
                 raise StopIteration
 
+        #print('next end', batch_size, i)
         return io.DataBatch([batch_data], [batch_label], batch_size - i)
 
     def check_data_shape(self, data_shape):
@@ -178,15 +225,10 @@ class FaceImageIter(io.DataIter):
         if len(data[0].shape) == 0:
             raise RuntimeError('Data shape is wrong')
 
-    def imdecode(self, s, bbox):
+    def imdecode(self, s):
         """Decodes a string or byte string to an NDArray.
         See mx.img.imdecode for more details."""
-        img = mx.image.imdecode(s)
-        if bbox is not None:
-          #print(img.shape, bbox)
-          _begin = (max(0, bbox[1]-self.margin//2), max(0, bbox[0]-self.margin//2),0)
-          _end = (min(img.shape[0], bbox[3]+self.margin//2), min(img.shape[1], bbox[2]+self.margin//2), 3)
-          img = nd.slice(img, begin=_begin, end=_end)
+        img = mx.image.imdecode(s) #mx.ndarray
         return img
 
     def read_image(self, fname):
@@ -642,6 +684,314 @@ class FaceImageIter2(io.DataIter):
         """Final postprocessing step before image is loaded into the batch."""
         return nd.transpose(datum, axes=(2, 0, 1))
 
+class FaceImageIter3(io.DataIter):
+
+    def __init__(self, batch_size, ctx_num, images_per_identity, data_shape,
+                 path_imgrec = None,
+                 shuffle=False, mean = None, use_extra = False, model = None,
+                 patch = [0,0,96,112,0], rand_mirror = False,
+                 data_name='data', label_name='softmax_label', **kwargs):
+        """Opens the indexed RecordIO at path_imgrec and sets up identity-grouped batching state."""
+        super(FaceImageIter3, self).__init__()
+        assert(path_imgrec)
+        logging.info('loading recordio %s...', path_imgrec)
+        path_imgidx = path_imgrec[0:-4]+".idx"
+        self.imgrec = recordio.MXIndexedRecordIO(path_imgidx, path_imgrec, 'r')  # pylint: disable=redefined-variable-type
+        # Record 0 is a header: label[0] ends the image-id range, label[0]..label[1] is the identity-id range.
+        s = self.imgrec.read_idx(0)
+        header, _ = recordio.unpack(s)
+        assert(header.flag==1)
+        self.seq = range(1, int(header.label[0]))
+        self.idx2range = {}
+        self.seq_identity = range(int(header.label[0]), int(header.label[1]))
+        for identity in self.seq_identity:
+          s = self.imgrec.read_idx(identity)
+          header, _ = recordio.unpack(s)
+          assert(header.flag==2)
+          self.idx2range[identity] = (int(header.label[0]), int(header.label[1]))
+        print('idx2range', len(self.idx2range))
+
+        # path_root is not a named parameter of this class; take it from kwargs (None when absent).
+        self.path_root = kwargs.get('path_root')
+        self.mean = mean
+        self.nd_mean = None
+        if self.mean:
+          self.mean = np.array(self.mean, dtype=np.float32).reshape(1,1,3)
+          self.nd_mean = mx.nd.array(self.mean).reshape((1,1,3))
+        self.patch = patch
+
+        self.check_data_shape(data_shape)
+        self.provide_data = [(data_name, (batch_size,) + data_shape)]
+        self.provide_label = [(label_name, (batch_size,))]
+        self.batch_size = batch_size
+        self.data_shape = data_shape
+        self.shuffle = shuffle
+        self.image_size = '%d,%d'%(data_shape[1],data_shape[2])
+        self.rand_mirror = rand_mirror
+        self.ctx_num = ctx_num
+        self.images_per_identity = images_per_identity
+        per_batch_size = int(batch_size/ctx_num)  # was never defined here; same formula FaceImageIter4 uses
+        self.identities = int(per_batch_size/self.images_per_identity)
+        self.min_per_identity = 1
+        assert self.min_per_identity<=self.images_per_identity
+        print(self.images_per_identity, self.identities, self.min_per_identity)
+        self.extra = None
+        self.model = model
+        if use_extra:
+          self.provide_data = [(data_name, (batch_size,) + data_shape), ('extra', (batch_size, per_batch_size))]
+          self.extra = np.full(self.provide_data[1][1], -1.0, dtype=np.float32)
+          c = 0
+          while c<batch_size:
+            a = 0
+            while a<per_batch_size:
+              b = a+images_per_identity
+              self.extra[(c+a):(c+b),a:b] = 1.0
+              a = b
+            c += per_batch_size
+          self.extra = nd.array(self.extra)
+          print(self.extra)
+        else:
+          self.provide_data = [(data_name, (batch_size,) + data_shape)]
+        self.cur = [0,0]
+        self.reset()
+        self.inited = False
+
+    def offline_reset(self):
+      self.seq_sim_identity = []
+      data = nd.zeros( self.provide_data[0][1] )
+      label = nd.zeros( self.provide_label[0][1] )
+      #label = np.zeros( self.provide_label[0][1] )
+      X = None
+      ba = 0
+      batch_num = 0
+      while ba<len(self.seq):
+        batch_num+=1
+        if batch_num%10==0:
+          print('loading batch',batch_num, ba)
+        bb = min(ba+self.batch_size, len(self.seq))
+        _count = bb-ba
+        for i in xrange(_count):
+          key = self.seq[i+ba]
+          _label, fname, bbox, landmark = self.imglist[key]
+          s = self.read_image(fname)
+          _data = self.imdecode(s)
+          #_data = self.augmentation_transform([_data])[0]
+          _npdata = _data.asnumpy()
+          if landmark is not None:
+            _npdata = face_preprocess.preprocess(_npdata, bbox = bbox, landmark=landmark, image_size=self.image_size)
+          if self.mean is not None:
+            _npdata = _npdata.astype(np.float32)
+            _npdata -= self.mean
+            _npdata *= 0.0078125
+          nimg = np.zeros(_npdata.shape, dtype=np.float32)
+          nimg[self.patch[1]:self.patch[3],self.patch[0]:self.patch[2],:] = _npdata[self.patch[1]:self.patch[3], self.patch[0]:self.patch[2], :]
+          #print(_npdata.shape)
+          #print(_npdata)
+          _data = mx.nd.array(nimg)
+          data[i][:] = self.postprocess_data(_data)
+          label[i][:] = _label
+        db = mx.io.DataBatch(data=(data,self.extra), label=(label,))
+        self.model.forward(db, is_train=False)
+        net_out = self.model.get_outputs()
+        _embeddings = net_out[0].asnumpy()
+        _embeddings = sklearn.preprocessing.normalize(_embeddings)
+        if _count<self.batch_size:
+          _embeddings = _embeddings[0:_count,:]
+        #print(_embeddings.shape)
+        if X is None:
+          X = np.zeros( (len(self.olabels), _embeddings.shape[1]), dtype=np.float32 )
+        nplabel = label.asnumpy()
+        for i in xrange(_count):
+          ilabel = int(nplabel[i])
+          #print(ilabel, ilabel.__class__)
+          X[ilabel] += _embeddings[i]
+        ba = bb
+      X = sklearn.preprocessing.normalize(X)
+      d = X.shape[1]
+      faiss_params = [20,5]
+      print('start to train faiss')
+      print(X.shape)
+      quantizer = faiss.IndexFlatL2(d)  # the other index
+      index = faiss.IndexIVFFlat(quantizer, d, faiss_params[0], faiss.METRIC_L2)
+      assert not index.is_trained
+      index.train(X)
+      index.add(X)
+      assert index.is_trained
+      print('trained')
+      index.nprobe = faiss_params[1]
+      k = self.identities
+      D, I = index.search(X, k)     # actual search
+      print(I.shape)
+      self.labels = []
+      for i in xrange(I.shape[0]):
+        #assert I[i][0]==i
+        for j in xrange(k):
+          _label = I[i][j]
+          assert _label<len(self.olabels)
+          self.labels.append(_label)
+      print('labels assigned', len(self.labels))
+
+    def reset(self):
+        """Resets the iterator to the beginning of the data."""
+        print('call reset()')
+        if self.shuffle:
+            self.offline_reset()  # was a bare offline_reset(); the method is defined on this class
+            random.shuffle(self.seq)
+            random.shuffle(self.seq_identity)
+        if self.imgrec is not None:
+            self.imgrec.reset()
+        self.cur = [0,0]
+
+    def num_samples(self):
+      return len(self.seq)
+
+    def next_sample(self):
+        """Helper function for reading in next sample."""
+        #set total batch size, for example, 1800, and maximum size for each people, for example 45
+        while True:
+          if self.cur[0] >= len(self.seq_sim_identity):
+              raise StopIteration
+          identity = self.seq_sim_identity[self.cur[0]]
+          if self.cur[1]>=self.images_per_identity:
+            self.cur[0]+=1
+            self.cur[1]=0
+            s = self.imgrec.read_idx(identity)
+            header, _ = recordio.unpack(s)
+            self.idx_range = range(int(header.label[0]), int(header.label[1]))
+            continue
+          if self.shuffle and self.cur[1]==0:
+            random.shuffle(self.idx_range)
+          idx = self.idx_range[self.cur[1]]
+          self.cur[1] += 1
+          s = self.imgrec.read_idx(idx)
+          header, img = recordio.unpack(s)
+          return header.label, img, None, None
+
+
+    def brightness_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      src *= alpha
+      return src
+
+    def contrast_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      coef = np.array([[[0.299, 0.587, 0.114]]])
+      gray = src * coef
+      gray = (3.0 * (1.0 - alpha) / gray.size) * np.sum(gray)
+      src *= alpha
+      src += gray
+      return src
+
+    def saturation_aug(self, src, x):
+      alpha = 1.0 + random.uniform(-x, x)
+      coef = np.array([[[0.299, 0.587, 0.114]]])
+      gray = src * coef
+      gray = np.sum(gray, axis=2, keepdims=True)
+      gray *= (1.0 - alpha)
+      src *= alpha
+      src += gray
+      return src
+
+    def color_aug(self, img, x):
+      augs = [self.brightness_aug, self.contrast_aug, self.saturation_aug]
+      random.shuffle(augs)
+      for aug in augs:
+        #print(img.shape)
+        img = aug(img, x)
+        #print(img.shape)
+      return img
+
+    def mirror_aug(self, img):
+      _rd = random.randint(0,1)
+      if _rd==1:
+        for c in xrange(img.shape[2]):
+          img[:,:,c] = np.fliplr(img[:,:,c])
+      return img
+
+
+    def next(self):
+        if not self.inited:
+          self.reset()
+          self.inited = True
+        """Returns the next batch of data."""
+        #print('in next', self.cur, self.labelcur)
+        batch_size = self.batch_size
+        c, h, w = self.data_shape
+        batch_data = nd.empty((batch_size, c, h, w))
+        batch_label = nd.empty(self.provide_label[0][1])
+        i = 0
+        try:
+            while i < batch_size:
+                label, s, bbox, landmark = self.next_sample()
+                _data = self.imdecode(s)
+                if self.rand_mirror:
+                  _rd = random.randint(0,1)
+                  if _rd==1:
+                    _data = mx.ndarray.flip(data=_data, axis=1)
+                if self.nd_mean is not None:
+                    _data = _data.astype('float32')
+                    _data -= self.nd_mean
+                    _data *= 0.0078125
+                data = [_data]
+                try:
+                    self.check_valid_image(data)
+                except RuntimeError as e:
+                    logging.debug('Invalid image, skipping:  %s', str(e))
+                    continue
+                #print('aa',data[0].shape)
+                #data = self.augmentation_transform(data)
+                #print('bb',data[0].shape)
+                for datum in data:
+                    assert i < batch_size, 'Batch size must be multiples of augmenter output length'
+                    #print(datum.shape)
+                    batch_data[i][:] = self.postprocess_data(datum)
+                    batch_label[i][:] = label
+                    i += 1
+        except StopIteration:
+            if i<batch_size:
+                raise StopIteration
+
+        #print('next end', batch_size, i)
+        return io.DataBatch([batch_data], [batch_label], batch_size - i)
+
+    def check_data_shape(self, data_shape):
+        """Checks if the input data shape is valid"""
+        if not len(data_shape) == 3:
+            raise ValueError('data_shape should have length 3, with dimensions CxHxW')
+        if not data_shape[0] == 3:
+            raise ValueError('This iterator expects inputs to have 3 channels.')
+
+    def check_valid_image(self, data):
+        """Checks if the input data is valid"""
+        if len(data[0].shape) == 0:
+            raise RuntimeError('Data shape is wrong')
+
+    def imdecode(self, s):
+        """Decodes a string or byte string to an NDArray.
+        See mx.img.imdecode for more details."""
+        img = mx.image.imdecode(s) #mx.ndarray
+        return img
+
+    def read_image(self, fname):
+        """Reads an input image `fname` and returns the decoded raw bytes.
+
+        Example usage:
+        ----------
+        >>> dataIter.read_image('Face.jpg') # returns decoded raw bytes.
+        """
+        with open(os.path.join(self.path_root, fname), 'rb') as fin:
+            img = fin.read()
+        return img
+
+    def augmentation_transform(self, data):
+        """Transforms input data with specified augmentation."""
+        for aug in self.auglist:
+            data = [ret for src in data for ret in aug(src)]
+        return data
+
+    def postprocess_data(self, datum):
+        """Final postprocessing step before image is loaded into the batch."""
+        return nd.transpose(datum, axes=(2, 0, 1))
 
 class FaceImageIter4(io.DataIter):
 
@@ -705,15 +1055,6 @@ class FaceImageIter4(io.DataIter):
         per_batch_size = int(batch_size/ctx_num)
         self.provide_label = [(label_name, (batch_size,))]
         self.batch_size = batch_size
-        self.ctx_num = ctx_num 
-        self.images_per_identity = images_per_identity
-        self.identities = int(per_batch_size/self.images_per_identity)
-        self.min_per_identity = 10
-        if self.images_per_identity<=10:
-          self.min_per_identity = self.images_per_identity
-        self.min_per_identity = 1
-        assert self.min_per_identity<=self.images_per_identity
-        print(self.images_per_identity, self.identities, self.min_per_identity)
         self.data_shape = data_shape
         self.shuffle = shuffle
         self.image_size = '%d,%d'%(data_shape[1],data_shape[2])
@@ -748,6 +1089,15 @@ class FaceImageIter4(io.DataIter):
           print(self.extra)
         else:
           self.provide_data = [(data_name, (batch_size,) + data_shape)]
+        self.ctx_num = ctx_num 
+        self.images_per_identity = images_per_identity
+        self.identities = int(per_batch_size/self.images_per_identity)
+        self.min_per_identity = 10
+        if self.images_per_identity<=10:
+          self.min_per_identity = self.images_per_identity
+        self.min_per_identity = 1
+        assert self.min_per_identity<=self.images_per_identity
+        print(self.images_per_identity, self.identities, self.min_per_identity)
 
         if aug_list is None:
             self.auglist = mx.image.CreateAugmenter(data_shape, **kwargs)
@@ -893,25 +1243,14 @@ class FaceImageIter4(io.DataIter):
             while i < batch_size:
                 label, s, bbox, landmark = self.next_sample()
                 _data = self.imdecode(s)
-                #_data = self.augmentation_transform([_data])[0]
-                _npdata = _data.asnumpy()
-                if landmark is not None:
-                  _npdata = face_preprocess.preprocess(_npdata, bbox = bbox, landmark=landmark, image_size=self.image_size)
                 if self.rand_mirror:
                   _rd = random.randint(0,1)
                   if _rd==1:
-                    for c in xrange(_npdata.shape[2]):
-                      _npdata[:,:,c] = np.fliplr(_npdata[:,:,c])
-                if self.mean is not None:
-                  _npdata = _npdata.astype(np.float32)
-                  _npdata -= self.mean
-                  _npdata *= 0.0078125
-                nimg = np.zeros(_npdata.shape, dtype=np.float32)
-                nimg[self.patch[1]:self.patch[3],self.patch[0]:self.patch[2],:] = _npdata[self.patch[1]:self.patch[3], self.patch[0]:self.patch[2], :]
-                #print(_npdata.shape)
-                #print(_npdata)
-                _data = mx.nd.array(nimg)
-                #print(_data.shape)
+                    _data = mx.ndarray.flip(data=_data, axis=1)
+                if self.nd_mean is not None:
+                    _data = _data.astype('float32')
+                    _data -= self.nd_mean
+                    _data *= 0.0078125
                 data = [_data]
                 try:
                     self.check_valid_image(data)
diff --git a/src/lfw.py b/src/eval/lfw.py
similarity index 71%
rename from src/lfw.py
rename to src/eval/lfw.py
index 0ea902b..7400769 100644
--- a/src/lfw.py
+++ b/src/eval/lfw.py
@@ -34,7 +34,10 @@ from sklearn.model_selection import KFold
 from scipy import interpolate
 import sklearn
 from sklearn.decomposition import PCA
-#import facenet
+import mxnet as mx
+from mxnet import ndarray as nd
+
+
 
 def calculate_roc(thresholds, embeddings1, embeddings2, actual_issame, nrof_folds=10, pca = 0):
     assert(embeddings1.shape[0] == embeddings2.shape[0])
@@ -186,5 +189,89 @@ def read_pairs(pairs_filename):
             pairs.append(pair)
     return np.array(pairs)
 
+def load_dataset(lfw_dir, image_size):  # Decode every image referenced by lfw_dir/pairs.txt; returns ([plain, flipped] NDArrays, issame_list).
+  lfw_pairs = read_pairs(os.path.join(lfw_dir, 'pairs.txt'))
+  lfw_paths, issame_list = get_paths(lfw_dir, lfw_pairs, 'jpg')  # 'jpg' is the file extension handed to get_paths
+  lfw_data_list = []
+  for flip in [0,1]:  # one buffer per variant: index 0 = as decoded, index 1 = flipped
+    lfw_data = nd.empty((len(lfw_paths), 3, image_size[0], image_size[1]))  # channel count is hard-coded to 3; image_size must have at least two entries
+    lfw_data_list.append(lfw_data)
+  i = 0  # index of the image currently being written into both buffers
+  for path in lfw_paths:
+    with open(path, 'rb') as fin:
+      _bin = fin.read()
+      img = mx.image.imdecode(_bin)
+      img = nd.transpose(img, axes=(2, 0, 1))  # move axis 2 to the front (presumably HWC -> CHW; TODO confirm against mx.image.imdecode)
+      for flip in [0,1]:
+        if flip==1:
+          img = mx.ndarray.flip(data=img, axis=2)  # reverse the last axis; the unflipped copy was already stored on the flip==0 pass
+        lfw_data_list[flip][i][:] = img
+      i+=1
+      if i%1000==0:
+        print('loading lfw', i)  # progress report every 1000 images
+  print(lfw_data_list[0].shape)
+  print(lfw_data_list[1].shape)
+  return (lfw_data_list, issame_list)
 
+def test(lfw_set, mx_model, batch_size):  # Embed both image variants with mx_model; returns (acc1, std1, acc2, std2, mean embedding norm, embeddings_list).
+  print('testing lfw..')
+  lfw_data_list = lfw_set[0]  # list of per-variant data arrays; indices 0 and 1 are both used below
+  issame_list = lfw_set[1]  # passed unchanged to evaluate()
+  model = mx_model
+  embeddings_list = []
+  for i in xrange( len(lfw_data_list) ):
+    lfw_data = lfw_data_list[i]
+    embeddings = None
+    ba = 0  # [ba, bb) is the row range of the current batch
+    while ba<lfw_data.shape[0]:
+      bb = min(ba+batch_size, lfw_data.shape[0])  # the final batch may be shorter than batch_size
+      _data = nd.slice_axis(lfw_data, axis=0, begin=ba, end=bb)
+      _label = nd.ones( (bb-ba,) )  # all-ones labels, supplied only to fill the DataBatch label slot
+      #print(_data.shape, _label.shape)
+      db = mx.io.DataBatch(data=(_data,), label=(_label,))
+      model.forward(db, is_train=False)
+      net_out = model.get_outputs()
+      #_arg, _aux = model.get_params()
+      #__arg = {}
+      #for k,v in _arg.iteritems():
+      #  __arg[k] = v.as_in_context(_ctx)
+      #_arg = __arg
+      #_arg["data"] = _data.as_in_context(_ctx)
+      #_arg["softmax_label"] = _label.as_in_context(_ctx)
+      #for k,v in _arg.iteritems():
+      #  print(k,v.context)
+      #exe = sym.bind(_ctx, _arg ,args_grad=None, grad_req="null", aux_states=_aux)
+      #exe.forward(is_train=False)
+      #net_out = exe.outputs
+      _embeddings = net_out[0].asnumpy()  # the first model output is taken as the embedding batch
+      #print(_embeddings.shape)
+      if embeddings is None:
+        embeddings = np.zeros( (lfw_data.shape[0], _embeddings.shape[1]) )  # allocated lazily: the width is only known after the first forward pass
+      embeddings[ba:bb,:] = _embeddings
+      ba = bb
+    embeddings_list.append(embeddings)
+  # Average np.linalg.norm over every embedding row of every variant (computed before any normalisation).
+  _xnorm = 0.0
+  _xnorm_cnt = 0
+  for embed in embeddings_list:
+    for i in xrange(embed.shape[0]):
+      _em = embed[i]
+      _norm=np.linalg.norm(_em)
+      #print(_em.shape, _norm)
+      _xnorm+=_norm
+      _xnorm_cnt+=1
+  _xnorm /= _xnorm_cnt  # NOTE(review): divides by zero when there are no embedding rows
+  # acc1/std1 score variant 0 alone; acc2/std2 score the element-wise sum of variants 0 and 1.
+  embeddings = embeddings_list[0].copy()
+  embeddings = sklearn.preprocessing.normalize(embeddings)
+  _, _, accuracy, val, val_std, far = evaluate(embeddings, issame_list, nrof_folds=10)
+  acc1, std1 = np.mean(accuracy), np.std(accuracy)  # mean/std over the accuracy values returned by evaluate
+  #print('Validation rate: %2.5f+-%2.5f @ FAR=%2.5f' % (val, val_std, far))
+  #embeddings = np.concatenate(embeddings_list, axis=1)
+  embeddings = embeddings_list[0] + embeddings_list[1]  # element-wise sum, not concatenation
+  embeddings = sklearn.preprocessing.normalize(embeddings)
+  print(embeddings.shape)
+  _, _, accuracy, val, val_std, far = evaluate(embeddings, issame_list, nrof_folds=10)
+  acc2, std2 = np.mean(accuracy), np.std(accuracy)
+  return acc1, std1, acc2, std2, _xnorm, embeddings_list  # embeddings_list holds the per-variant arrays as filled in the batch loop
 
diff --git a/src/marginalnet.py b/src/marginalnet.py
index 4e8ba3e..dc44482 100644
--- a/src/marginalnet.py
+++ b/src/marginalnet.py
@@ -1,3 +1,6 @@
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
 import mxnet as mx
 import numpy as np
 
@@ -133,18 +136,29 @@ def resnet_unit6(data, num_filter, name, dim_match=True, workspace = 256):
   return body
 
 def resnet_unit7(data, num_filter, name, dim_match=True, workspace = 256):
+  # SE block: BN -> conv3x3 -> BN -> Act -> conv3x3 -> BN branch ("res"), multiplied by a sigmoid gate computed from its global average pool.
   bn_mom = 0.9
   shortcut = data
-  body = Conv(data=data, num_filter=num_filter, kernel=(3,3), stride=(1,1), pad=(1, 1), num_group=32,
+  body = mx.sym.BatchNorm(data=data, fix_gamma=False, eps=2e-5, momentum=bn_mom, name=name+'_bn1')
+  body = Conv(data=body, num_filter=num_filter, kernel=(3,3), stride=(1,1), pad=(1, 1),
                             name=name+"_conv1", workspace=workspace)
-  body = mx.sym.BatchNorm(data=body, fix_gamma=False, eps=2e-5, momentum=bn_mom, name=name+'_bn1')
-  body = Act(data=body, name=name+'_relu1')
-  body = Conv(data=body, num_filter=num_filter, kernel=(3,3), stride=(1,1), pad=(1, 1), num_group=32,
-                            name=name+"_conv2", workspace=workspace)
   body = mx.sym.BatchNorm(data=body, fix_gamma=False, eps=2e-5, momentum=bn_mom, name=name+'_bn2')
+  body = Act(data=body, name=name+'_relu1')
+  body = Conv(data=body, num_filter=num_filter, kernel=(3,3), stride=(1,1), pad=(1, 1),
+                            name=name+"_conv2", workspace=workspace)
+  res = mx.sym.BatchNorm(data=body, fix_gamma=False, eps=2e-5, momentum=bn_mom, name=name+'_bn3')  # kept separately so the gate below can rescale it
+  # Gate: global average pool -> 1x1 conv to num_filter//16 channels -> Act -> 1x1 conv back to num_filter -> sigmoid.
+  body = mx.sym.Pooling(data=res, global_pool=True, kernel=(7, 7), pool_type='avg', name=name+'_se_pool1')  # NOTE(review): kernel is presumably ignored when global_pool=True - confirm in MXNet docs
+  body = Conv(data=body, num_filter=num_filter//16, kernel=(1,1), stride=(1,1), pad=(0,0),
+                            name=name+"_se_conv1", workspace=workspace)
+  body = Act(data=body, name=name+'_se_relu1')
+  body = Conv(data=body, num_filter=num_filter, kernel=(1,1), stride=(1,1), pad=(0,0),
+                            name=name+"_se_conv2", workspace=workspace)
+  body = mx.symbol.Activation(data=body, act_type='sigmoid', name=name+"_se_sigmoid")
+  body = mx.symbol.broadcast_mul(res, body)  # scale the residual branch by the gate
+  # The shortcut is added only when dim_match is true; no activation follows the addition.
   if dim_match:
     body = body+shortcut
-  body = Act(data=body, name=name+'_relu2')
   return body
 
 def resnet_unit100(data, num_filter, name, dim_match=True, workspace = 256):
@@ -231,6 +245,9 @@ def get_symbol(num_classes, num_layers, conv_workspace=256):
       rtype = 3
     elif num_layers==52:
       filter_list = [64, 256, 512, 1024]
+      units = [2,3,15,3]
+      rtype = 3
+    elif num_layers==53: #se block
       units = [2,3,15,3]
       rtype = 7
     elif num_layers==74:
diff --git a/src/train_softmax.py b/src/train_softmax.py
index 15e334d..d74b77c 100644
--- a/src/train_softmax.py
+++ b/src/train_softmax.py
@@ -9,6 +9,7 @@ import random
 import logging
 import numpy as np
 from data import FaceIter
+from data import FaceImageIter
 from data import FaceImageIter2
 from data import FaceImageIter4
 from data import FaceImageIter5
@@ -16,7 +17,8 @@ import mxnet as mx
 from mxnet import ndarray as nd
 import argparse
 import mxnet.optimizer as optimizer
-sys.path.append(os.path.join(os.path.dirname(__file__), '..', 'common'))
+#sys.path.append(os.path.join(os.path.dirname(__file__), 'common'))
+sys.path.append(os.path.join(os.path.dirname(__file__), 'eval'))
 import spherenet
 import marginalnet
 import inceptions
@@ -113,6 +115,8 @@ def parse_args():
       help='feature incay')
   parser.add_argument('--use-deformable', type=int, default=0,
       help='')
+  parser.add_argument('--image-size', type=str, default='112,96',
+      help='')
   parser.add_argument('--patch', type=str, default='0_0_96_112_0',
       help='')
   parser.add_argument('--lr-steps', type=str, default='',
@@ -126,7 +130,7 @@ def get_symbol(args, arg_params, aux_params):
     new_args = arg_params
   else:
     new_args = None
-  data_shape = (args.image_channel,112,96)
+  data_shape = (args.image_channel,args.image_h,args.image_w)
   image_shape = ",".join([str(x) for x in data_shape])
   if args.network[0]=='s':
     embedding = spherenet.get_symbol(512, args.num_layers)
@@ -269,6 +273,9 @@ def train_net(args):
     args.rescale_threshold = 0
     args.image_channel = 3
     ppatch = [int(x) for x in args.patch.split('_')]
+    image_size = [int(x) for x in args.image_size.split(',')]
+    args.image_h = image_size[0]
+    args.image_w = image_size[1]
     assert len(ppatch)==5
     #if args.patch%2==1:
     #  args.image_channel = 1
@@ -291,7 +298,10 @@ def train_net(args):
     #path_imglist = "/raid5data/dplearn/MS-Celeb-Aligned/lst2"
     path_imgrec = os.path.join(args.data_dir, "train.rec")
     val_rec = os.path.join(args.data_dir, "val.rec")
-    args.use_val = True
+    if os.path.exists(val_rec):
+      args.use_val = True
+    else:
+      val_rec = None
     #args.num_classes = 10572 #webface
     #args.num_classes = 81017
     #args.num_classes = 82395
@@ -304,21 +314,19 @@ def train_net(args):
 
     print('Called with argument:', args)
 
-    data_shape = (args.image_channel,112,96)
+    data_shape = (args.image_channel,image_size[0],image_size[1])
     #mean = [127.5,127.5,127.5]
     mean = None
 
     if args.use_val:
-      val_dataiter = FaceImageIter2(
+      val_dataiter = FaceImageIter(
           batch_size           = args.batch_size,
           data_shape           = data_shape,
           path_imgrec          = val_rec,
           #path_imglist         = val_path,
           shuffle              = False,
-          exclude_lfw          = False,
           rand_mirror          = False,
           mean                 = mean,
-          patch                = ppatch,
       )
     else:
       val_dataiter = None
@@ -367,20 +375,13 @@ def train_net(args):
 
 
     if args.loss_type<=9:
-      train_dataiter = FaceImageIter2(
+      train_dataiter = FaceImageIter(
           batch_size           = args.batch_size,
           data_shape           = data_shape,
           path_imgrec          = path_imgrec,
-          path_imglist         = path_imglist,
           shuffle              = True,
-          exclude_lfw          = False,
           rand_mirror          = True,
-          brightness           = 0.4,
-          contrast             = 0.4,
-          saturation           = 0.4,
-          pca_noise            = 0.1,
           mean                 = mean,
-          patch                = ppatch,
       )
     elif args.loss_type==10:
       train_dataiter = FaceImageIter4(
@@ -391,7 +392,6 @@ def train_net(args):
           path_imglist         = path_imglist,
           shuffle              = True,
           rand_mirror          = True,
-          exclude_lfw          = False,
           mean                 = mean,
           patch                = ppatch,
           use_extra            = True,
@@ -406,7 +406,6 @@ def train_net(args):
           path_imglist         = path_imglist,
           shuffle              = True,
           rand_mirror          = True,
-          exclude_lfw          = False,
           mean                 = mean,
           patch                = ppatch,
       )
@@ -461,124 +460,14 @@ def train_net(args):
     _cb = mx.callback.Speedometer(args.batch_size, 10)
 
     lfw_dir = os.path.join(args.data_dir,'lfw')
-    lfw_pairs = lfw.read_pairs(os.path.join(lfw_dir, 'pairs.txt'))
-    lfw_paths, issame_list = lfw.get_paths(lfw_dir, lfw_pairs, 'jpg')
-    imgs = []
-    lfw_data_list = []
-    for flip in [0,1]:
-      lfw_data = nd.empty((len(lfw_paths), args.image_channel, 112, 96))
-      lfw_data_list.append(lfw_data)
-    i = 0
-
-    for path in lfw_paths:
-      with open(path, 'rb') as fin:
-        _bin = fin.read()
-        if ppatch[4]%2==1:
-          img = mx.image.imdecode(_bin, flag=0)
-          if img.shape[2]<args.image_channel:
-            img = nd.broadcast_to(img, (img.shape[0], img.shape[1], 3))
-        else:
-          img = mx.image.imdecode(_bin)
-        img = nd.transpose(img, axes=(2, 0, 1))
-        img = img.asnumpy()
-        #print(img.shape)
-        if mean is not None:
-          img = img.astype(np.float32)
-          img -= np.array(mean, dtype=np.float32).reshape(args.image_channel,1,1)
-          img *= 0.0078125
-        for flip in [0,1]:
-          _img = img.copy()
-          if flip==1:
-            #_img = _img.asnumpy()
-            for c in xrange(_img.shape[0]):
-              _img[c,:,:] = np.fliplr(_img[c,:,:])
-            #_img = nd.array( _img )
-          #print(img.shape)
-          nimg = np.zeros(_img.shape, dtype=np.float32)
-          nimg[:,ppatch[1]:ppatch[3],ppatch[0]:ppatch[2]] = _img[:, ppatch[1]:ppatch[3], ppatch[0]:ppatch[2]]
-          lfw_data_list[flip][i][:] = nd.array(nimg)
-        i+=1
-        if i%1000==0:
-          print('loading lfw', i)
-    print(lfw_data_list[0].shape)
-    print(lfw_data_list[1].shape)
+    lfw_set = lfw.load_dataset(lfw_dir, image_size)
 
     def lfw_test(nbatch):
-      print('testing lfw..')
-      #GLOBAL_STEP = nbatch
-      #return 0.1
-      embeddings_list = []
-      for i in xrange( len(lfw_data_list) ):
-        lfw_data = lfw_data_list[i]
-        embeddings = None
-        ba = 0
-        _ctx = ctx[0]
-        while ba<lfw_data.shape[0]:
-          bb = min(ba+args.batch_size, lfw_data.shape[0])
-          _data = nd.slice_axis(lfw_data, axis=0, begin=ba, end=bb)
-          _label = nd.ones( (bb-ba,) )
-          #print(_data.shape, _label.shape)
-          db = mx.io.DataBatch(data=(_data,), label=(_label,))
-          model.forward(db, is_train=False)
-          net_out = model.get_outputs()
-          #_arg, _aux = model.get_params()
-          #__arg = {}
-          #for k,v in _arg.iteritems():
-          #  __arg[k] = v.as_in_context(_ctx)
-          #_arg = __arg
-          #_arg["data"] = _data.as_in_context(_ctx)
-          #_arg["softmax_label"] = _label.as_in_context(_ctx)
-          #for k,v in _arg.iteritems():
-          #  print(k,v.context)
-          #exe = sym.bind(_ctx, _arg ,args_grad=None, grad_req="null", aux_states=_aux)
-          #exe.forward(is_train=False)
-          #net_out = exe.outputs
-          _embeddings = net_out[0].asnumpy()
-          #print(_embeddings.shape)
-          if embeddings is None:
-            embeddings = np.zeros( (lfw_data.shape[0], _embeddings.shape[1]) )
-          embeddings[ba:bb,:] = _embeddings
-          ba = bb
-        embeddings_list.append(embeddings)
-
-      _xnorm = 0.0
-      _xnorm_cnt = 0
-      for embed in embeddings_list:
-        for i in xrange(embed.shape[0]):
-          _em = embed[i]
-          _norm=np.linalg.norm(_em)
-          #print(_em.shape, _norm)
-          _xnorm+=_norm
-          _xnorm_cnt+=1
-      _xnorm /= _xnorm_cnt
-      print('[%d]XNorm: %f' % (nbatch, _xnorm))
-
-      acc_list = []
-      embeddings = embeddings_list[0].copy()
-      embeddings = sklearn.preprocessing.normalize(embeddings)
-      _, _, accuracy, val, val_std, far = lfw.evaluate(embeddings, issame_list, nrof_folds=10)
-      acc_list.append(np.mean(accuracy))
-      print('[%d]Accuracy: %1.5f+-%1.5f' % (nbatch, np.mean(accuracy), np.std(accuracy)))
-      #print('Validation rate: %2.5f+-%2.5f @ FAR=%2.5f' % (val, val_std, far))
-      #embeddings = np.concatenate(embeddings_list, axis=1)
-      embeddings = embeddings_list[0] + embeddings_list[1]
-      embeddings = sklearn.preprocessing.normalize(embeddings)
-      print(embeddings.shape)
-      _, _, accuracy, val, val_std, far = lfw.evaluate(embeddings, issame_list, nrof_folds=10)
-      acc_list.append(np.mean(accuracy))
-      print('[%d]Accuracy-Flip: %1.5f+-%1.5f' % (nbatch, np.mean(accuracy), np.std(accuracy)))
-      racc = acc_list[1]
-      #racc = max(*acc_list)
-      #print('Validation rate: %2.5f+-%2.5f @ FAR=%2.5f' % (val, val_std, far))
-      #pca = PCA(n_components=128)
-      #embeddings = pca.fit_transform(embeddings)
-      #embeddings = sklearn.preprocessing.normalize(embeddings)
-      #print(embeddings.shape)
-      #_, _, accuracy, val, val_std, far = lfw.evaluate(embeddings, issame_list, nrof_folds=10)
-      #acc_list.append(np.mean(accuracy))
-      #print('[%d]Accuracy-PCA: %1.3f+-%1.3f' % (nbatch, np.mean(accuracy), np.std(accuracy)))
-      #print('Validation rate: %2.5f+-%2.5f @ FAR=%2.5f' % (val, val_std, far))
-      return racc, embeddings_list
+      acc1, std1, acc2, std2, xnorm, embeddings_list = lfw.test(lfw_set, model, args.batch_size)
+      print('[%d]XNorm: %f' % (nbatch, xnorm))
+      print('[%d]Accuracy: %1.5f+-%1.5f' % (nbatch, acc1, std1))
+      print('[%d]Accuracy-Flip: %1.5f+-%1.5f' % (nbatch, acc2, std2))
+      return acc2, embeddings_list
 
 
     def val_test():
@@ -600,7 +489,7 @@ def train_net(args):
     save_step = [0]
     if len(args.lr_steps)==0:
       #lr_steps = [40000, 70000, 90000]
-      lr_steps = [30000, 50000, 70000, 90000]
+      lr_steps = [40000, 60000, 80000]
       if args.loss_type==1:
         lr_steps = [100000, 140000, 160000]
     else: