Mxnet做图片分类训练的时候提供了多种输入,这里介绍.rec
数据的制作。
mxnet版本:0.904
1.收集图片
这里收集了两类图片,猫和狗的图片。
第一类
第二类
所有的图片放到两个文件夹中
2.生成mxnet训练需要的数据格式
如果mxnet自带的im2rec.py有问题,这里用的是另外的文件,文件名叫im2rec2.py,代码在最后面。
#生成.lst文件
python im2rec2.py --list True --exts .jpg --exts .jpeg --recusive=True --train-ratio 0.7 --test-ratio 0.3 train-cat ./train-cat
说明: python im2rec2.py 参数1 参数2 参数3 参数4 参数5 参数6 参数7...
参数1 --list:--list True 创建make_list
参数2 --exts: 需要查找的图像的扩展名
参数3 --train-ratio : 使用训练的图片的比例
参数4 --test-trtio : 使用测试的图片的比例
参数5 --recusive : 如果是true 就会递归寻找子目录的文件
参数6 train-cat : 输出lst和rec文件的前缀
参数7 ./train-cat : 包含图像文件夹目录的根目录
#生成.rec,im2rec需要编译生成,可以参考文献[1]
../bin/im2rec ./train-cat_train.lst train-cat/ train-cat_train.rec resize=224
说明:2. ../bin/im2rec 参数1 参数2 参数3 参数4 ...
参数1:train.lst,test.lst, or val.lst
参数2: 目录为trian-cat,则该参数为train-cat。这里还要和.lst文件结合
参数3:生成的文件名称 如:image.rec
后面的参数根据需求添加
train-cat_test.lst的生成方法一样,这里忽略了,同时也忽略了val数据的生存
# -*- coding: utf-8 -*-
from __future__ import print_function
import os
import sys
curr_path = os.path.abspath(os.path.dirname(__file__))
sys.path.append(os.path.join(curr_path, "../python"))
import mxnet as mx
import random
import argparse
import cv2
import time
def list_image(root, recursive, exts):
print (root)
print('exts ',exts)
image_list = []
if recursive:
cat = {}
for path, subdirs, files in os.walk(root, followlinks=True):
subdirs.sort()
print(len(cat), path)
for fname in files:
fpath = os.path.join(path, fname)
#print ('ddd :',fpath)
suffix = os.path.splitext(fname)[1].lower()
#print(suffix)
if os.path.isfile(fpath) and (suffix in exts):
if path not in cat:
cat[path] = len(cat)
yield (len(image_list), os.path.relpath(fpath, root), cat[path])
else:
for fname in os.listdir(root):
fpath = os.path.join(root, fname)
suffix = os.path.splitext(fname)[1].lower()
if os.path.isfile(fpath) and (suffix in exts):
yield (len(image_list), os.path.relpath(fpath, root), 0)
def write_list(path_out, image_list):
with open(path_out, 'w') as fout:
for i, item in enumerate(image_list):
line = '%d\t' % item[0]
for j in item[2:]:
line += '%f\t' % j
line += '%s\n' % item[1]
fout.write(line)
def make_list(args):
image_list = list_image(args.root, args.recursive, args.exts)
image_list = list(image_list)
if args.shuffle is True:
random.seed(100)
random.shuffle(image_list)
N = len(image_list)
chunk_size = (N + args.chunks - 1) / args.chunks
for i in xrange(args.chunks):
chunk = image_list[i * chunk_size:(i + 1) * chunk_size]
if args.chunks > 1:
str_chunk = '_%d' % i
else:
str_chunk = ''
sep = int(chunk_size * args.train_ratio)
sep_test = int(chunk_size * args.test_ratio)
write_list(args.prefix + str_chunk + '_test.lst', chunk[:sep_test])
write_list(args.prefix + str_chunk + '_train.lst', chunk[sep_test:sep_test + sep])
write_list(args.prefix + str_chunk + '_val.lst', chunk[sep_test + sep:])
def read_list(path_in):
with open(path_in) as fin:
while True:
line = fin.readline()
if not line:
break
line = [i.strip() for i in line.strip().split('\t')]
item = [int(line[0])] + [line[-1]] + [float(i) for i in line[1:-1]]
yield item
def image_encode(args, item, q_out):
try:
img = cv2.imread(os.path.join(args.root, item[1]), args.color)
except:
print('imread error:', item[1])
return
if img is None:
print('read none error:', item[1])
return
if args.center_crop:
if img.shape[0] > img.shape[1]:
margin = (img.shape[0] - img.shape[1]) / 2;
img = img[margin:margin + img.shape[1], :]
else:
margin = (img.shape[1] - img.shape[0]) / 2;
img = img[:, margin:margin + img.shape[0]]
if args.resize:
if img.shape[0] > img.shape[1]:
newsize = (args.resize, img.shape[0] * args.resize / img.shape[1])
else:
newsize = (img.shape[1] * args.resize / img.shape[0], args.resize)
img = cv2.resize(img, newsize)
if len(item) > 3 and args.pack_label:
header = mx.recordio.IRHeader(0, item[2:], item[0], 0)
else:
header = mx.recordio.IRHeader(0, item[2], item[0], 0)
try:
s = mx.recordio.pack_img(header, img, quality=args.quality, img_fmt=args.encoding)
q_out.put((s, item))
except Exception, e:
print('pack_img error:', item[1], e)
return
def read_worker(args, q_in, q_out):
while True:
item = q_in.get()
if item is None:
break
image_encode(args, item, q_out)
def write_worker(q_out, fname, working_dir):
pre_time = time.time()
count = 0
fname_rec = os.path.basename(fname)
fname_rec = os.path.splitext(fname)[0] + '.rec'
fout = open(fname+'.tmp', 'w')
record = mx.recordio.MXRecordIO(os.path.join(working_dir, fname_rec), 'w')
while True:
deq = q_out.get()
if deq is None:
break
s, item = deq
record.write(s)
line = '%d\t' % item[0]
for j in item[2:]:
line += '%f\t' % j
line += '%s\n' % item[1]
fout.write(line)
if count % 1000 == 0:
cur_time = time.time()
print('time:', cur_time - pre_time, ' count:', count)
pre_time = cur_time
count += 1
os.rename(fname+'.tmp', fname)
def parse_args():
parser = argparse.ArgumentParser(
formatter_class=argparse.ArgumentDefaultsHelpFormatter,
description='Create an image list or \
make a record database by reading from an image list')
parser.add_argument('prefix', help='prefix of input/output lst and rec files.')
parser.add_argument('root', help='path to folder containing images.')
cgroup = parser.add_argument_group('Options for creating image lists')
cgroup.add_argument('--list', type=bool, default=False,
help='If this is set im2rec will create image list(s) by traversing root folder\
and output to <prefix>.lst.\
Otherwise im2rec will read <prefix>.lst and create a database at <prefix>.rec')
cgroup.add_argument('--exts', type=list,action='append',default=['.jpeg', '.jpg','.bmp'],
help='list of acceptable image extensions.')
cgroup.add_argument('--chunks', type=int, default=1, help='number of chunks.')
cgroup.add_argument('--train-ratio', type=float, default=1.0,
help='Ratio of images to use for training.')
cgroup.add_argument('--test-ratio', type=float, default=0,
help='Ratio of images to use for testing.')
cgroup.add_argument('--recursive', type=bool, default=False,
help='If true recursively walk through subdirs and assign an unique label\
to images in each folder. Otherwise only include images in the root folder\
and give them label 0.')
rgroup = parser.add_argument_group('Options for creating database')
rgroup.add_argument('--resize', type=int, default=0,
help='resize the shorter edge of image to the newsize, original images will\
be packed by default.')
rgroup.add_argument('--center-crop', type=bool, default=False,
help='specify whether to crop the center image to make it rectangular.')
rgroup.add_argument('--quality', type=int, default=80,
help='JPEG quality for encoding, 1-100; or PNG compression for encoding, 1-9')
rgroup.add_argument('--num-thread', type=int, default=1,
help='number of thread to use for encoding. order of images will be different\
from the input list if >1. the input list will be modified to match the\
resulting order.')
rgroup.add_argument('--color', type=int, default=1, choices=[-1, 0, 1],
help='specify the color mode of the loaded image.\
1: Loads a color image. Any transparency of image will be neglected. It is the default flag.\
0: Loads image in grayscale mode.\
-1:Loads image as such including alpha channel.')
rgroup.add_argument('--encoding', type=str, default='.jpg', choices=['.jpg', '.png'],
help='specify the encoding of the images.')
rgroup.add_argument('--shuffle', default=True, help='If this is set as True, \
im2rec will randomize the image order in <prefix>.lst')
rgroup.add_argument('--pack-label', default=False,
help='Whether to also pack multi dimensional label in the record file')
args = parser.parse_args()
args.prefix = os.path.abspath(args.prefix)
args.root = os.path.abspath(args.root)
return args
if __name__ == '__main__':
args = parse_args()
if args.list:
make_list(args)
print('ddd',args.prefix)
else:
if os.path.isdir(args.prefix):
working_dir = args.prefix
else:
working_dir = os.path.dirname(args.prefix)
files = [os.path.join(working_dir, fname) for fname in os.listdir(working_dir)
if os.path.isfile(os.path.join(working_dir, fname))]
count = 0
for fname in files:
if fname.startswith(args.prefix) and fname.endswith('.lst'):
print('Creating .rec file from', fname, 'in', working_dir)
count += 1
image_list = read_list(fname)
# -- write_record -- #
try:
import multiprocessing
q_in = [multiprocessing.Queue(1024) for i in range(args.num_thread)]
q_out = multiprocessing.Queue(1024)
read_process = [multiprocessing.Process(target=read_worker, args=(args, q_in[i], q_out)) \
for i in range(args.num_thread)]
for p in read_process:
p.start()
write_process = multiprocessing.Process(target=write_worker, args=(q_out, fname, working_dir))
write_process.start()
for i, item in enumerate(image_list):
q_in[i % len(q_in)].put(item)
for q in q_in:
q.put(None)
for p in read_process:
p.join()
q_out.put(None)
write_process.join()
except ImportError:
print('multiprocessing not available, fall back to single threaded encoding')
import Queue
q_out = Queue.Queue()
fname_rec = os.path.basename(fname)
fname_rec = os.path.splitext(fname)[0] + '.rec'
record = mx.recordio.MXRecordIO(os.path.join(working_dir, fname_rec), 'w')
cnt = 0
pre_time = time.time()
for item in image_list:
image_encode(args, item, q_out)
if q_out.empty():
continue
_, s, _ = q_out.get()
record.write(s)
if cnt % 1000 == 0:
cur_time = time.time()
print('time:', cur_time - pre_time, ' count:', cnt)
pre_time = cur_time
cnt += 1
if not count:
print('Did not find and list file with prefix %s'%args.prefix)
参考文献:
[1] http://mxnet.io/api/scala/io.html?highlight=im2rec