import xlrd
import numpy as np
import pandas as pd
import jieba
import jieba.analyse
import codecs
from openpyxl import Workbook
def insertOne(value1, value2, sheet):
    """Append a two-cell row ``[value1, value2]`` to ``sheet``.

    Args:
        value1: Value for the first cell of the new row.
        value2: Value for the second cell of the new row.
        sheet: Object exposing ``append(row)``; presumably an openpyxl
            worksheet -- confirm against the caller.

    Returns:
        None. ``sheet`` is modified in place.
    """
    sheet.append([value1, value2])
# Create a new Excel workbook and add a sheet to it.
if __name__ == "__main__":
    book = Workbook()
    # Index 0 places the new sheet first in the workbook.
    sheet = book.create_sheet("sheet" + str(2), 0)
    # `sheetnames` replaces the deprecated `get_sheet_names()` accessor.
    sheets = book.sheetnames

    file_name = '2-2_data.xlsx'
    # NOTE(review): xlrd >= 2.0 only reads legacy .xls files, so opening an
    # .xlsx workbook here needs xlrd < 2.0 -- confirm the installed version.
    x1 = xlrd.open_workbook(file_name)
    sheet1 = x1.sheet_by_name('sheet1')
    rows = sheet1.nrows
    cols = sheet1.ncols

    # Segment the text in column index 1 of every row (cut_all=False) and
    # collect all resulting tokens in reading order.
    word_lst = []
    for i in range(rows):
        word_lst.extend(jieba.cut(sheet1.cell_value(i, 1), cut_all=False))

    # Count how many times each token occurs; keys keep first-seen order.
    word_dict = {}
    for item in word_lst:
        word_dict[item] = word_dict.get(item, 0) + 1

    # TODO(review): the original listing is cut off at this point (it ends in
    # a bare `pr`, presumably the start of a `print` call). The steps that
    # report the counts and write them to the workbook are missing and must
    # be restored from the full script.
Python+jieba实现分词和词频统计并将结果存入Excel
最新推荐文章于 2023-06-06 22:54:30 发布
本文介绍了如何利用 Python 的 jieba 库进行中文分词并统计词频，最后将结果保存到 Excel 文件中，便于后续的数据分析和可视化。
摘要由CSDN通过智能技术生成