docx 解析到数据库:读取目录下每个 .docx 文件的第一个表格,逐行写入数据库表 jsda

def docx_insert_data():
    """Insert the rows of the first table of every ``.docx`` file into ``jsda``.

    Scans the directory named by the module-level ``path``, opens each file
    whose extension is ``.docx`` (case-insensitive) with ``Document`` and
    issues one ``INSERT`` per row of the document's first table through the
    module-level ``cursor``.  The text of cell *i* is stored in the *i*-th
    column of the fixed column list below, so a row with fewer cells than
    columns only fills the leading columns.

    Processing is best-effort: a file that cannot be read or inserted is
    reported on stdout and the scan continues with the next file.  Rows
    that are wider than the known column list are reported and skipped
    instead of producing a malformed statement.

    NOTE(review): every table row is inserted, including a header row if the
    table has one, and no commit is issued here -- presumably the caller
    commits on the connection that owns ``cursor``; confirm.
    """
    # Column order of ``jsda``: ten named fields, then placeholder1..placeholder18.
    columns = ['sequence_number', 'drug_name', 'enterprise', 'batch_number', 'specification',
               'source', 'standard', 'result', 'defective_item', 'certification_body']
    columns += ['placeholder%d' % i for i in range(1, 19)]

    for files in os.listdir(path):
        print(files)
        if os.path.splitext(files)[1].lower() != '.docx':
            continue
        try:
            word = Document(os.path.join(path, files))
            doc_tables = word.tables
            if not doc_tables:
                # Previously surfaced as an opaque "list index out of range".
                print('%s: no table found, skipped' % files)
                continue
            for row_no, row in enumerate(doc_tables[0].rows, 1):
                values = [cell.text for cell in row.cells]
                if len(values) > len(columns):
                    # More cells than known columns would yield a column list
                    # and a placeholder list of different lengths.
                    print('%s: row %d has %d cells, at most %d supported, skipped'
                          % (files, row_no, len(values), len(columns)))
                    continue
                # Column names come from the fixed list above; cell values are
                # always passed as bound parameters, never formatted into SQL.
                sql_query = 'insert into jsda(%s) values(%s)' % (
                    ', '.join(columns[:len(values)]),
                    ', '.join(['%s'] * len(values)),
                )
                cursor.execute(sql_query, values)
        except Exception as e:
            # Per-file boundary: report which file failed and keep going.
            print('%s: %s' % (files, e))
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值