提取oracle数据库HTML内容转换成正文格式

最新推荐文章于 2022-03-11 16:39:42 发布

qq_41928442

最新推荐文章于 2022-03-11 16:39:42 发布

阅读量2.3k

点赞数

文章标签： oracle python

本文链接：https://blog.csdn.net/qq_41928442/article/details/82976290

版权

提取 Oracle 数据库中的 HTML 内容，转换成正文格式（去标签），再更新到同表的 TZNR 字段

# -*- coding:utf-8 -*-
import cx_Oracle
from bs4 import BeautifulSoup


# Strip the markup from every HTML value in the table and write the resulting
# plain text back into the TZNR column of the same row (matched on WZ).
conn = cx_Oracle.connect('用户名', '用户密码', 'localhost:1521/ORCL')
try:
    cur = conn.cursor()
    try:
        # Fetch every (WZ, HTML) pair up front; the same cursor is reused for
        # the UPDATE statements below, so the result set must be fully read
        # before the cursor is re-prepared.
        cur.execute('select WZ,HTML from 表名')
        rows = cur.fetchall()

        # The UPDATE text never changes, so prepare it once instead of once
        # per row; execute(None, ...) re-runs the prepared statement.
        cur.prepare("UPDATE 表名 t SET t.TZNR = :TZNR WHERE t.WZ = :WZ")

        for wz, raw_html in rows:
            if raw_html is None:
                # A NULL HTML column has nothing to convert, and passing None
                # to BeautifulSoup raises; leave such rows untouched.
                continue
            plain_text = BeautifulSoup(raw_html, 'lxml').text
            cur.execute(None, {'TZNR': plain_text, 'WZ': wz})
            print('sucess!!!')

        # Commit once for the whole batch rather than after every row.
        conn.commit()
    finally:
        # Release the cursor even when a query or the HTML parsing fails.
        cur.close()
finally:
    # Always close the connection so a failure does not leak the session.
    conn.close()