1、本文针对 TotalText 数据集进行处理。标注 txt 文件打开后,每一行由逗号分隔的若干字段组成,开头形如 `x: [[...]], y: [[...]]`。
每一行(line)中只有前两个字段 x、y 是所需的坐标,因此只对 x、y 进行处理。
2、基本思路:分别取 x、y 坐标中的最小值和最大值,构成一个矩形框(box),使每个 box 包含对应的全部标注点。
3、代码如下:
# -*- coding: UTF-8 -*-
#根据数据集批量截取图片并保存
import numpy as np
import glob as glob
import cv2
import os
from PIL import Image
import os
import time
import matplotlib.pyplot as plt
def main():
path_txt = "~/下载/TotalText/examples/txt/traintrain/"
count=1
for f in os.listdir(path_txt):
f = open(path_txt + f,'r')
lines = f.readlines()
num = len(lines)
# i=0
num = 1
for line in lines:
print(f)
li = line.split(',')
x = li[0].lstrip('x:').lstrip(' ').replace('[', '').replace('