由于用到的数据集很庞大,昨天在服务器上跑了一夜,早上来了发现仍然只切了不到三分之一。晚上抽空试了一下使用多进程来切割图像。
切割图像的函数还是使用之前的函数,只是根据mask标记的不同,相对应的代码也有所不同。
import numpy
import openslide
import os
from PIL import Image
import pandas as pd
import numpy as np
import csv
from multiprocessing import Manager
from concurrent.futures import ProcessPoolExecutor
from openslide import OpenSlideUnsupportedFormatError
# ---------------------------------------------------------------------------
# Module-level configuration (paths are hard-coded absolute locations).
# ---------------------------------------------------------------------------

# Patch geometry. Both values are 512; presumably `cut_size` is the patch side
# length and `space_size` the step between patches -- confirm against cut().
cut_size = 512
space_size = 512

# Three quarters of the pixel count of one cut_size x cut_size patch.
# True division makes this a float (196608.0 for cut_size == 512).
# NOTE(review): looks like a minimum-coverage threshold -- verify at use site.
area = (cut_size * cut_size * 3) / 4

# CSV files; their schema is not visible from this part of the file.
kimage_csv_path = "/home/cad429/code/data/train_chuli.csv"
unmatch_csv_path = "/home/cad429/code/data/unmatch.csv"

# Directory that cut() joins with '<image_name>.tiff' to locate an image.
k_image_path = "/home/cad429/code/data/train_images"
# Presumably the directory of the matching label masks -- TODO confirm.
k_image_label_path = "/home/cad429/code/data/train_label_masks"

# Presumably the output directory for the generated patches -- TODO confirm.
# Earlier value, kept for reference: '/home/cad429/code/data/splitk'
k_image_patch_path = "/data/panda/splitk"
def cut(cut_size,space_size,patch_path,image_name):
image_path = os.path.join(k_image_path, image_name + '.tiff')
mask_