划分自己的训练集和验证集代码

import os
import random
import shutil

# Source (training) directories and destination (validation) directories.
images_path = "/Media/E/NEU-DET/data/neu/train2020"
annos_path = "/Media/E/NEU-DET/data/neu/ANNOTATIONS_TRAIN"
val_images_path = "/Media/E/NEU-DET/data/neu/val2020/"
val_annos_path = "/Media/E/NEU-DET/data/neu/ANNOTATIONS_VAL"


def split_train_val(images_dir: str, annos_dir: str,
                    val_images_dir: str, val_annos_dir: str,
                    class_size: int = 300, val_per_class: int = 30,
                    num_classes: int = 6, seed=None) -> list:
    """Move a random validation subset of images and their XML annotations.

    The image directory listing is sorted and cut into ``num_classes``
    consecutive groups of ``class_size`` files (the last group takes whatever
    remains). From every group, ``val_per_class`` images are picked at random
    and moved to ``val_images_dir``; the annotation with the same base name
    and an ``.xml`` extension is moved from ``annos_dir`` to ``val_annos_dir``.

    NOTE(review): grouping by position assumes that file names sort so that
    each class occupies one contiguous run of ``class_size`` files -- confirm
    this holds for the dataset's naming scheme.

    Args:
        images_dir: Directory holding the training images.
        annos_dir: Directory holding the training annotations.
        val_images_dir: Destination directory for validation images.
        val_annos_dir: Destination directory for validation annotations.
        class_size: Number of consecutive files forming one group.
        val_per_class: Number of images to move out of each group.
        num_classes: Number of groups to cut the listing into.
        seed: Optional seed for a reproducible selection; ``None`` gives a
            different selection on every run.

    Returns:
        The file names of the images that were moved, in selection order.

    Raises:
        FileNotFoundError: If a selected image has no annotation file. This
            is checked before anything is moved.
    """
    rng = random.Random(seed)
    # os.listdir gives no ordering guarantee; sort so the slices are stable.
    names = sorted(os.listdir(images_dir))

    selected = []
    for index in range(num_classes):
        start = index * class_size
        # The last group is open-ended so no trailing file is left out.
        stop = start + class_size if index < num_classes - 1 else None
        group = names[start:stop]
        selected.extend(rng.sample(group, min(val_per_class, len(group))))

    # Resolve and validate every pair first so a missing annotation cannot
    # leave the dataset half-split.
    pairs = []
    for name in selected:
        anno = os.path.join(annos_dir, os.path.splitext(name)[0] + ".xml")
        if not os.path.isfile(anno):
            raise FileNotFoundError(
                "annotation not found for image {!r}: {}".format(name, anno)
            )
        pairs.append((os.path.join(images_dir, name), anno))

    # Without an existing directory, shutil.move would rename the first file
    # to the destination path instead of moving it inside.
    os.makedirs(val_images_dir, exist_ok=True)
    os.makedirs(val_annos_dir, exist_ok=True)

    for image, anno in pairs:
        shutil.move(image, val_images_dir)
        shutil.move(anno, val_annos_dir)

    return selected


if __name__ == "__main__":
    split_train_val(images_path, annos_path, val_images_path, val_annos_path)

我的数据集共有1800张图片，分为6个类别，每个类别300张。划分时，从每个类别中随机划出30张，验证集一共180张图片，并连同对应的标注文件一起移动；这里的标注文件是xml格式。

  • 2
    点赞
  • 5
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值