diff --git a/recognition/data/rec2image.py b/recognition/data/rec2image.py
new file mode 100644
index 0000000..535df24
--- /dev/null
+++ b/recognition/data/rec2image.py
@@ -0,0 +1,63 @@
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+import os
+import sys
+import mxnet as mx
+from mxnet import ndarray as nd
+import random
+import argparse
+import cv2
+import time
+import sklearn
+import numpy as np
+
+
+def main(args):
+  include_datasets = args.include.split(',')
+  rec_list = []
+  for ds in include_datasets:
+    path_imgrec = os.path.join(ds, 'train.rec')
+    path_imgidx = os.path.join(ds, 'train.idx')
+    imgrec = mx.recordio.MXIndexedRecordIO(path_imgidx, path_imgrec, 'r')  # pylint: disable=redefined-variable-type
+    rec_list.append(imgrec)
+  if not os.path.exists(args.output):
+    os.makedirs(args.output)
+  for ds_id in range(len(rec_list)):
+    id_list = []
+    imgrec = rec_list[ds_id]
+    s = imgrec.read_idx(0)
+    header, _ = mx.recordio.unpack(s)
+    assert header.flag>0
+    print('header0 label', header.label)
+    header0 = (int(header.label[0]), int(header.label[1]))
+    seq_identity = range(int(header.label[0]), int(header.label[1]))
+    pp=0
+    for identity in seq_identity:
+      id_dir = os.path.join(args.output, "%d_%d"%(ds_id, identity))
+      os.makedirs(id_dir)
+      pp+=1
+      if pp%10==0:
+        print('processing id', pp)
+      s = imgrec.read_idx(identity)
+      header, _ = mx.recordio.unpack(s)
+      imgid = 0
+      for _idx in range(int(header.label[0]), int(header.label[1])):
+        s = imgrec.read_idx(_idx)
+        _header, _img = mx.recordio.unpack(s)
+        _img = mx.image.imdecode(_img).asnumpy()[:,:,::-1] # to bgr
+        image_path = os.path.join(id_dir, "%d.jpg"%imgid)
+        cv2.imwrite(image_path, _img)
+        imgid+=1
+
+
+
+
+if __name__ == '__main__':
+  parser = argparse.ArgumentParser(description='do dataset merge')
+  # general
+  parser.add_argument('--include', default='', type=str, help='')
+  parser.add_argument('--output', default='', type=str, help='')
+  args = parser.parse_args()
+  main(args)
+