def compute():
    """Write per-image mask-area ratios to ``ratio_annotations.json``.

    Reads ``instances_train2019.json`` from the current working directory,
    groups the ``*.jpg`` files found there by the ``category_id`` of their
    annotation, and measures each image's mask area as the number of non-zero
    pixels in the ``.png`` file sharing the image's base name. Each area is
    divided by the largest area within its category, rounded to three
    decimals, and stored under the image's file name.

    Raises:
        KeyError: If a ``*.jpg`` file has no matching annotation entry.
        FileNotFoundError: If the annotation file or a mask file is missing.
    """
    with open('instances_train2019.json') as fid:
        data = json.load(fid)

    # Image id -> image record, used to resolve each annotation's file name.
    images = {image['id']: image for image in data['images']}

    # File name -> annotation. When several annotations reference the same
    # image, the last one listed wins.
    annotations = {
        images[ann['image_id']]['file_name']: ann
        for ann in data['annotations']
    }

    # Each category collects many image paths.
    object_category_paths = defaultdict(list)
    for path in glob.glob(os.path.join('', '*.jpg')):
        name = os.path.basename(path)
        category = annotations[name]['category_id']
        object_category_paths[category].append(path)

    ratio_anns = {}
    for paths in tqdm(object_category_paths.values()):
        areas = []
        for object_path in paths:
            name = os.path.basename(object_path)
            # The mask's stem is everything before the first '.' of the name.
            mask_path = os.path.join('', '{}.png'.format(name.split('.')[0]))
            # The context manager releases the file handle after every mask.
            with Image.open(mask_path) as mask:
                # Binarise: any non-zero (white) pixel counts as 1, black as 0.
                # Builtin ``bool`` replaces the ``np.bool`` alias that NumPy
                # removed in 1.24.
                binary = np.array(mask.convert('L'), dtype=bool)
            areas.append(binary.sum())

        areas = np.array(areas)
        max_area = areas.max()
        if max_area > 0:
            ratios = np.round(areas / max_area, 3)
        else:
            # Every mask in this category is empty; avoid 0/0 -> NaN, which
            # json.dump would emit as a non-standard ``NaN`` token.
            ratios = np.zeros(len(areas))

        for object_path, ratio in zip(paths, ratios):
            # Store plain Python floats so the JSON encoder handles them.
            ratio_anns[os.path.basename(object_path)] = float(ratio)

    with open('ratio_annotations.json', 'w') as fid:
        json.dump(ratio_anns, fid)
# Script entry point: run the ratio computation only when executed directly,
# not when this module is imported.
if __name__ == "__main__":
    compute()