1.保存19类
# Split a label file into two ID lists.
#
# Each input line is sliced as: characters [0:6] -> sample ID,
# characters [7:9] -> label flag. Lines whose flag is exactly ' 1' have their
# ID appended to `path3`; every other non-blank line has its ID appended to
# `path`.
# NOTE(review): this looks like the Pascal VOC "<id> <flag>" image-set layout
# -- confirm against the actual source file.
path = '19'        # output: IDs whose flag is not ' 1'
path2 = '源文件'    # input label file
path3 = '1'        # output: IDs whose flag is ' 1'

# Context managers close all three files even if a write fails midway.
with open(path2, "r") as source, \
        open(path, "a") as others, \
        open(path3, "a") as positives:
    # Iterate to EOF instead of a fixed line count: a hard-coded count writes
    # empty IDs once readline() starts returning '' and silently ignores any
    # lines beyond the count.
    for a in source:
        if not a.strip():
            # A blank line carries no ID; skip it rather than emit an empty entry.
            continue
        sample_id = a[0:6]
        if a[7:9] == ' 1':
            positives.write(sample_id + '\n')
        else:
            others.write(sample_id + '\n')
        # Echo the processed line as progress output.
        print(a)
2.保存10类
# Collect the IDs flagged ' 1' from the first ten per-class "*_test.txt" files
# into a single list file, `test3.txt` (opened in append mode, so an ID that is
# flagged in several class files is written several times).
#
# VOC_BBOX_LABEL_NAMES must already be defined as an indexable sequence of at
# least ten class-name strings; it is not defined in this snippet.
datapath = '文件路径'
for class_index in range(10):
    class_list = datapath + VOC_BBOX_LABEL_NAMES[class_index] + '_test.txt'
    # Context managers guarantee both handles are closed for every class,
    # even if reading or writing raises.
    with open(class_list, "r") as f2, open(datapath + 'test3.txt', "a") as f1:
        # Iterate to EOF rather than a fixed line count, and use a distinct
        # loop variable: the original inner loop reused `i`, shadowing the
        # class index of the outer loop.
        for a in f2:
            # Characters [7:9] hold the flag, characters [0:6] the sample ID.
            if a[7:9] == ' 1':
                f1.write(a[0:6] + '\n')
            # Echo the processed line as progress output.
            print(a)
3.去除重复
#coding:utf-8
import shutil
# Copy the file at `readDir` to `writeDir`, keeping only the first occurrence
# of each line (original order is preserved).
#
# `datapath` must already be defined; it is not defined in this snippet.
readDir = datapath+'源.txt'
writeDir = datapath+ "目标.txt"
lines_seen = set()

# Context managers close both files even if an I/O error occurs midway.
with open(readDir, "r") as f, open(writeDir, "w") as outfile:
    for line in f:
        # Compare without the line terminator so that a final line lacking a
        # trailing newline is still recognised as a duplicate of an earlier,
        # newline-terminated copy.
        entry = line.rstrip('\n')
        if entry in lines_seen:
            continue
        lines_seen.add(entry)
        # Always terminate the entry so later appends start on a fresh line.
        outfile.write(entry + '\n')
print("success")
4.创建每一类的样本名txt
#!/usr/bin/env python
# -*- coding:utf-8 -*-
import os
import xml.etree.ElementTree as ET
# Build the sample list for one class: append the base name of every
# annotation XML that contains at least one <object> whose <name> equals the
# selected class.
#
# NOTE: without a trailing comma the parentheses below do NOT create a tuple;
# VOC_BBOX_LABEL_NAMES is a plain string. The file names built from it by
# string concatenation rely on that, so keep exactly one entry enabled.
VOC_BBOX_LABEL_NAMES = (
    # 'wbc',
    # 'rbc',
    'platelets'
)
data_dir = '/media/chenli/G/BCCD'
files = os.listdir(data_dir + '/Annotations')

# Append mode: re-running this snippet adds the same names again.
# The context manager closes the list file even if an XML file fails to parse.
with open('/media/chenli/G/BCCD/ImageSets/Main/' + VOC_BBOX_LABEL_NAMES + '.txt', "a") as f:
    for id_ in files:
        anno = ET.parse(os.path.join(data_dir, 'Annotations', id_))
        for obj in anno.findall('object'):
            # findtext() yields '' when <name> is missing or empty, instead of
            # raising AttributeError on a None element.
            name = obj.findtext('name', default='').lower().strip()
            # Exact comparison: because VOC_BBOX_LABEL_NAMES is a string, an
            # `in` test would be a substring match (e.g. '' or 'plate' would
            # match 'platelets').
            if name == VOC_BBOX_LABEL_NAMES:
                # Strip the extension rather than slicing a fixed 16
                # characters, so stems of any length are written correctly.
                f.write(os.path.splitext(id_)[0] + '\n')
                # One match is enough; list each annotation file at most once.
                break
5.分成train和test
#coding:utf-8
import shutil
# Split the per-class "<class>_all.txt" list into two files: entries that also
# appear in trainval.txt go to "<class>.txt", all others to "<class>_test.txt".
#
# VOC_BBOX_LABEL_NAMES must already be defined as a single class-name string;
# it is not defined in this snippet.
writeDir = '/media/chenli/G/BCCD/ImageSets/Main/'+VOC_BBOX_LABEL_NAMES+'_all.txt'
writeDir1 = '/media/chenli/G/BCCD/ImageSets/Main/'+VOC_BBOX_LABEL_NAMES+'.txt'
writeDir2 = '/media/chenli/G/BCCD/ImageSets/Main/'+VOC_BBOX_LABEL_NAMES+'_test.txt'
readDir = '/media/chenli/G/BCCD/ImageSets/Main/trainval.txt'

# Load the trainval entries first, so the output files are not truncated if
# trainval.txt cannot be opened. Entries are stored without surrounding
# whitespace so that a missing final newline or a stray '\r' cannot cause a
# trainval entry to be misrouted to the test list.
with open(readDir, "r") as f:
    trainval_ids = set(line.strip() for line in f)

# Context managers close every handle, including the "_all" input that the
# original snippet left open.
with open(writeDir, "r") as f2, \
        open(writeDir1, "w") as outfile, \
        open(writeDir2, "w") as outfile2:
    for line in f2:
        if line.strip() in trainval_ids:
            outfile.write(line)
        else:
            outfile2.write(line)
print("success")
6.将一个文件的文本添加到另外一个文件中
# Append the entire contents of 1.txt to the end of 2.txt.
# The context manager closes both files; the original ended with `f.close`
# (no parentheses), which only references the method and never closes 1.txt.
with open('1.txt', "r") as f, open('2.txt', "a") as f2:
    f2.write(f.read())