python中文本预处理的一般流程_如何用python进行文本预处理

展开全部

#!/usr/bin/python
"""Average the intervals between named time points recorded in a log file.

Expected log layout, as implied by the parser below:

* a line without a tab names the current record (stored in ``path``);
* a line with tabs is ``<time point name>\\t...\\t<integer timestamp>``;
* a line equal to ``str_seperator`` closes the current record.

The code is written to run unchanged on Python 2 and Python 3.
"""

import io

# A line consisting of exactly this text closes one record in the log.
str_seperator = "=================================================================================="

# Names of the time points; the trailing number is the list index that
# DURATIONS refers to.  Entries 12 and 13 are produced by the parser when
# "enter DrawClient at" / "leave DrawClient at" occur a second time.
timePointName = [
    "enter OpenNextImage at",                # 0
    "enter OpenImage at",                    # 1
    "In OpenImage send On_ImageRefresh at",  # 2
    "leave OpenImage at",                    # 3
    "leave OpenNextImage at",                # 4
    "enter LoadImage at",                    # 5
    "decode began at",                       # 6
    "enter DrawClient at",                   # 7
    "leave DrawClient at",                   # 8
    "decode end at",                         # 9
    "in LoadImage send On_ImageRefresh at",  # 10
    "leave loadImage at",                    # 11
    "second enter DrawClient at",            # 12
    "second leave DrawClient at",            # 13
]

# Raw string: same value as before, without leaning on "\l" not being an
# escape sequence.
LOG_PATH = r"F:\log.txt"

# (label, start index, end index) into timePointName; each reported figure
# is the mean of ``end - start`` over all records.
DURATIONS = (
    ("avgTotal", 0, 13),
    ("avgFirstDraw", 2, 8),
    ("avgLoadImage", 5, 11),
    ("avgSecondDraw", 10, 13),
)


def parse_log(lines, echo_paths=False):
    """Group the timestamps found in *lines* by record.

    Args:
        lines: iterable of text lines (an open text file works).
        echo_paths: when true, print every record-name line as it is read.

    Returns:
        dict mapping each record name to a dict of
        ``{time point name: integer timestamp}``.

    Raises:
        ValueError: if the text after the last tab of an entry line is not
            an integer.

    A record is stored only when its closing separator line is seen, so a
    trailing record with no separator after it is discarded.
    """
    records = {}
    current = {}
    path = ""
    for raw in lines:
        line = raw.strip()

        if line == str_seperator:
            # Separators with no record name before them are ignored.
            if path:
                records[path] = current
            current = {}
            path = ""
            continue

        first_tab = line.find("\t")
        if first_tab == -1:
            # Any line without a tab (blank lines included) becomes the
            # name of the current record.
            path = line
            if echo_paths:
                print(line)
            continue

        name = line[:first_tab]
        stamp = int(line[line.rfind("\t") + 1:])
        if name in current:
            # A repeated time point is kept under a "second ..." key; any
            # further repeat overwrites that same key.
            current["second " + name] = stamp
        else:
            current[name] = stamp
    return records


def average_durations(records):
    """Return ``[(label, mean), ...]`` for every entry of DURATIONS.

    Args:
        records: mapping as returned by :func:`parse_log`.

    Returns:
        A list of ``(label, float)`` pairs in DURATIONS order, or an empty
        list when *records* is empty (instead of dividing by zero).

    Raises:
        KeyError: if a record lacks a time point that DURATIONS needs.
    """
    count = len(records)
    if not count:
        return []

    totals = [0] * len(DURATIONS)
    for stamps in records.values():
        for slot, (_label, start, end) in enumerate(DURATIONS):
            totals[slot] += stamps[timePointName[end]] - stamps[timePointName[start]]

    return [
        (label, total / float(count))
        for (label, _start, _end), total in zip(DURATIONS, totals)
    ]


def main():
    """Read LOG_PATH, echo each record name, then print the averages."""
    # "utf-8-sig" drops a leading BOM only when one is present, and the
    # with-block closes the file even if parsing raises.
    with io.open(LOG_PATH, "r", encoding="utf-8-sig") as fobj:
        records = parse_log(fobj, echo_paths=True)

    averages = average_durations(records)
    if not averages:
        print("no complete records found in " + LOG_PATH)
        return
    for label, value in averages:
        print("%s %s" % (label, value))


if __name__ == "__main__":
    main()

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值