TableMASTER Training and Testing Workflow

I. Environment Setup

Reference: https://github.com/JiaquanYe/TableMASTER-mmocr
Because the project depends on mmdetection, the version requirements are as follows:
Python: 3.6+
PyTorch: 1.3+
CUDA: 9.2+
GCC: 5+
To set up GCC on a server without sudo privileges, export the following paths:

export PATH=/home/work/guopei/gcc-8.2.0-bin/bin:$PATH
export LD_LIBRARY_PATH=/home/work/guopei/gcc-8.2.0-bin/lib64:$LD_LIBRARY_PATH
export LD_LIBRARY_PATH=/home/work/guopei/gcc-8.2.0-bin/lib/:$LD_LIBRARY_PATH
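
Before compiling any extensions, it is worth confirming that the compiler picked up from PATH really is the GCC 8.2.0 configured above, since mmdetection's C++/CUDA ops are built with whatever "gcc" resolves to. A minimal check (the install prefix is specific to my machine):

import subprocess

# Show which gcc is on PATH and its version; expect the 8.2.0 build configured above.
print(subprocess.check_output(["which", "gcc"]).decode().strip())
print(subprocess.check_output(["gcc", "--version"]).decode().splitlines()[0])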

1. Install mmdetection

cd ./mmdetection-2.11.0
pip install -v -e .

2. Install mmcv

pip install mmcv-full==1.3.4 -f https://download.openmmlab.com/mmcv/dist/cu102/torch1.6.0/index.html
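
Note that the "cu102/torch1.6.0" part of the wheel index URL must match the CUDA and PyTorch versions actually installed in your environment. A quick way to check what you have before picking the URL (a minimal sketch):

import torch

# The mmcv-full wheel URL above assumes CUDA 10.2 and PyTorch 1.6.x;
# change those parts of the URL if your versions differ.
print("PyTorch        :", torch.__version__)
print("Built with CUDA:", torch.version.cuda)
print("CUDA available :", torch.cuda.is_available())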

3. Install mmocr

pip install mmocr==0.2.0
cd /home/work/guopei/workspace/OCR/table_recog/TableMASTER-mmocr
pip install -v -e .

4. Verify that the environment is installed correctly

(screenshot)
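
In place of the screenshot, a minimal sanity check is to import each package and print its version; if all four imports succeed and the versions match what was installed above, the environment is ready:

import torch
import mmcv
import mmdet
import mmocr

# Expected roughly: mmcv 1.3.4, mmdet 2.11.0, mmocr 0.2.0.
print("torch :", torch.__version__, "| CUDA available:", torch.cuda.is_available())
print("mmcv  :", mmcv.__version__)
print("mmdet :", mmdet.__version__)
print("mmocr :", mmocr.__version__)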

II. Training Data Preparation

1. Parse the PubTabNet data

python ./table_recognition/data_preprocess.py

Before running the script, remember to update the "raw_img_root" and "save_root" paths.
My changes are shown below:
(screenshots)
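
For reference, the two variables I edited in data_preprocess.py look roughly like this (illustrative values only; point them at your own PubTabNet download and output directory):

# In table_recognition/data_preprocess.py (paths from my setup, adjust to yours):
raw_img_root = '/home/work/data/guopei/pubtabnet/'                  # downloaded PubTabNet data
save_root = '/home/work/data/guopei/pubtabnet/table_master_data/'   # preprocessed output folder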

2. Generate the LMDB data

python ./table_recognition/lmdb_maker.py

(screenshots)
This script generates the LMDB files and stores them under /home/work/data/guopei/pubtabnet/table_master_data/lmdb/, as shown below:
(screenshot)
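
To confirm the LMDB was written correctly, it can be opened read-only and the entry count checked (a minimal sketch using the lmdb package; the exact folder layout under lmdb/ depends on lmdb_maker.py, so point lmdb_path at one of the generated databases):

import lmdb

# One of the databases produced by lmdb_maker.py (path from my setup, adjust to yours).
lmdb_path = '/home/work/data/guopei/pubtabnet/table_master_data/lmdb/'

# readonly + lock=False: only inspect, never modify.
env = lmdb.open(lmdb_path, readonly=True, lock=False)
print('number of entries:', env.stat()['entries'])
env.close()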

III. Train the Model

sh ./table_recognition/expr/table_recognition_dist_train.sh

(screenshots)
The training process looks like this:
(screenshot)
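
The shell script wraps mmdetection's distributed training launcher; before committing GPUs to a long run, it can help to load the training config and spot-check the settings it will use. A sketch using mmcv's Config (the config path below is hypothetical; substitute whichever file table_recognition_dist_train.sh actually points at):

from mmcv import Config

# Hypothetical path; substitute the config file referenced by the training script.
cfg = Config.fromfile('./configs/textrecog/master/table_master_lmdb_ResnetExtract_Ranger_0930.py')

# Spot-check the data settings and optimizer before launching.
print('samples per GPU:', cfg.data.samples_per_gpu)
print('workers per GPU:', cfg.data.workers_per_gpu)
print('optimizer      :', cfg.optimizer)
print('total epochs   :', cfg.get('total_epochs'))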

IV. Testing

Test the table structure model:

CUDA_VISIBLE_DEVICES=7 python table_recognition/table_inference_guopei.py

The contents of table_inference_guopei.py are as follows:

import os

import torch
from mmcv.image import imread

from mmdet.apis import init_detector
from mmocr.apis.inference import model_inference
from mmocr.datasets import build_dataset  # noqa: F401
from mmocr.models import build_detector  # noqa: F401

import sys
import glob
import time
import pickle
import numpy as np
from tqdm import tqdm
from table_recognition.utils import (detect_visual, end2end_visual, structure_visual,
                                     coord_convert, clip_detect_bbox,
                                     rectangle_crop_img, delete_invalid_bbox)


def build_model(config_file, checkpoint_file):
    device = 'cpu'
    model = init_detector(config_file, checkpoint=checkpoint_file, device=device)

    if model.cfg.data.test['type'] == 'ConcatDataset':
        model.cfg.data.test.pipeline = model.cfg.data.test['datasets'][
            0].pipeline

    return model


class Inference:
    def __init__(self, config_file, checkpoint_file, device=None):
        self.config_file = config_file
        self.checkpoint_file = checkpoint_file
        self.model = build_model(config_file, checkpoint_file)

        if device is None:
            device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
        else:
            # Specify GPU device
            device = torch.device("cuda:{}".format(device))
        self.model.to(device)

    def result_format(self, pred, file_path):
        raise NotImplementedError

    def predict_single_file(self, file_path):
        pass

    def predict_batch(self, imgs):
        pass


class Structure_Recognition(Inference):
    def __init__(self, config_file, checkpoint_file, samples_per_gpu=1):
        self.config_file = config_file
        self.checkpoint_file = checkpoint_file
        super().__init__(config_file, checkpoint_file)
        self.samples_per_gpu = samples_per_gpu

    def result_format(self, pred, file_path=None):
        pred = pred[0]
        return pred

    def predict_single_file(self, file_path):
        # numpy inference
        img = imread(file_path)
        file_name = os.path.basename(file_path)
        result = model_inference(self.model, [img], batch_mode=True)
        result = self.result_format(result, file_path)
        result_dict = {file_name:result}
        return result, result_dict


class Runner:
    def __init__(self, cfg):
        self.structure_master_config = cfg['structure_master_config']
        self.structure_master_ckpt = cfg['structure_master_ckpt']
        self.structure_master_result_folder = cfg['structure_master_result_folder']

        self.test_folder = cfg['test_folder']

    def init_structure_master(self):
        self.master_structure_inference = \
            Structure_Recognition(self.structure_master_config, self.structure_master_ckpt)

    def release_structure_master(self):
        torch.cuda.empty_cache()
        del self.master_structure_inference

    def do_structure_predict(self, path, is_save=True, gpu_idx=None):
        if isinstance(path, str):
            if os.path.isfile(path):
                all_results = dict()
                print('Single file in structure master prediction ...')
                _, result_dict = self.master_structure_inference.predict_single_file(path)
                all_results.update(result_dict)

            elif os.path.isdir(path):
                all_results = dict()
                print('Folder files in structure master prediction ...')
                search_path = os.path.join(path, '*.png')
                files = glob.glob(search_path)
                files = files[:20]   # added by me (Guopei): only run the first 20 files for a quick test
                for file in tqdm(files):
                    _, result_dict = self.master_structure_inference.predict_single_file(file)
                    all_results.update(result_dict)

            else:
                raise ValueError

        elif isinstance(path, list):
            all_results = dict()
            print('Chunks files in structure master prediction ...')
            for i, p in enumerate(path):
                _, result_dict = self.master_structure_inference.predict_single_file(p)
                all_results.update(result_dict)
                if gpu_idx is not None:
                    print("[GPU_{} : {} / {}] {} file structure inference. ".format(gpu_idx, i+1, len(path), p))
                else:
                    print("{} file structure inference. ".format(p))

        else:
            raise ValueError

        # save for matcher.
        if is_save:
            if not os.path.exists(self.structure_master_result_folder):
                os.makedirs(self.structure_master_result_folder)

            if not isinstance(path, list):
                save_file = os.path.join(self.structure_master_result_folder, 'structure_master_results.pkl')
            else:
                save_file = os.path.join(self.structure_master_result_folder, 'structure_master_results_{}.pkl'.format(gpu_idx))

            with open(save_file, 'wb') as f:
                pickle.dump(all_results, f)

    def run(self, path):
        # structure master
        self.init_structure_master()
        self.do_structure_predict(path, is_save=True)
        self.release_structure_master()


if __name__ == '__main__':
    cfg = {
        'structure_master_config': './work_dir/1114_TableMASTER_structure/table_master_lmdb_ResnetExtract_Ranger_0930.py',
        'structure_master_ckpt': './work_dir/1114_TableMASTER_structure/latest.pth',
        'structure_master_result_folder': './structure_val_result',
        'test_folder': '/home/work/data/guopei/pubtabnet/val/',
    }

    # single gpu device inference
    runner = Runner(cfg)
    runner.run(cfg['test_folder'])
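
After the run finishes, all predictions are written to structure_master_results.pkl under structure_val_result/. A quick way to inspect what was saved (a sketch; the fields inside each prediction depend on the model's decode step, so they are only printed here, not assumed):

import pickle

# Pickle written by do_structure_predict() above.
with open('./structure_val_result/structure_master_results.pkl', 'rb') as f:
    results = pickle.load(f)

print('number of images:', len(results))
for file_name, pred in list(results.items())[:3]:
    # One entry per image file name; pred is whatever model_inference returned.
    fields = list(pred.keys()) if isinstance(pred, dict) else type(pred)
    print(file_name, '->', fields)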

The recognition quality is quite good, but inference is a bit slow; how to speed it up will be covered in the next post. Technical discussion is welcome!

Our table recognition solution
