python处理 dbf文件_python读写dbf文件

import datetime
import decimal
import itertools
import struct

def _dbf_text(raw):
    """Return the byte string *raw* as the interpreter's native ``str``.

    On Python 2 ``bytes`` is ``str`` and the value is returned untouched.
    On Python 3 it is decoded as Latin-1, which maps every byte to exactly
    one character, so decoding cannot fail and field widths are preserved.
    """
    if isinstance(raw, str):
        return raw
    return raw.decode('latin-1')


def _dbf_value(typ, deci, raw):
    """Convert the raw bytes of one field into a Python value.

    *typ* is the one-character field type and *deci* the declared number of
    decimal places.  Types other than N, D, L and F are returned as text,
    padding included.
    """
    value = _dbf_text(raw)
    if typ == 'N':
        value = value.replace('\0', '').lstrip()
        if value == '':
            return 0
        if deci:
            return decimal.Decimal(value)
        return int(value)
    if typ == 'D':
        # A date that was never filled in is stored as blanks; there is no
        # calendar date to build from it, so report it as None.
        if not value.strip(' \0'):
            return None
        return datetime.date(int(value[:4]), int(value[4:6]), int(value[6:8]))
    if typ == 'L':
        if value in 'YyTt':
            return 'T'
        if value in 'NnFf':
            return 'F'
        return '?'
    if typ == 'F':
        # Same rule as for N fields: an empty field reads as zero.
        value = value.replace('\0', '').strip()
        return float(value) if value else 0.0
    return value


def dbfreader(f):
    """Return an iterator over the records in an Xbase DBF file.

    The first row yielded contains the field names.
    The second row contains the field specs: (type, size, decimal places).
    Subsequent rows contain the data records, one list per record:

    * N fields become ``int`` (``decimal.Decimal`` when the field declares
      decimal places); an empty field becomes ``0``.
    * D fields become ``datetime.date``; an empty field becomes ``None``.
    * L fields become ``'T'``, ``'F'`` or ``'?'``.
    * F fields become ``float``; an empty field becomes ``0.0``.
    * Every other type is returned as text, padding included.

    Records marked as deleted are skipped.

    File should be opened for binary reads.  Names, type codes and text
    values are native ``str`` objects; on Python 3 they are decoded from the
    file's bytes as Latin-1.

    Raises ``AssertionError`` if the field descriptor array is not followed
    by the 0x0D terminator, and ``struct.error`` if the file ends early.
    """
    # See DBF format spec at:
    #     http://www.pgts.com.au/download/public/xbase.htm#DBF_STRUCT

    # 32-byte file header: 4 bytes skipped, uint32 record count,
    # uint16 header length, remaining 22 bytes skipped.
    numrec, lenheader = struct.unpack('<xxxxLH22x', f.read(32))
    # The header is 32 bytes + one 32-byte descriptor per field + terminator.
    numfields = (lenheader - 33) // 32

    fields = []
    for _ in range(numfields):
        name, typ, size, deci = struct.unpack('<11sc4xBB14x', f.read(32))
        name = _dbf_text(name).replace('\0', '')  # eliminate NULs from string
        fields.append((name, _dbf_text(typ), size, deci))
    yield [field[0] for field in fields]
    yield [tuple(field[1:]) for field in fields]

    terminator = f.read(1)
    if terminator != b'\r':
        # Raised explicitly (rather than with ``assert``) so the check still
        # runs under ``python -O``.
        raise AssertionError('DBF field descriptors are not terminated by 0x0D')

    # Every record is a one-byte deletion flag followed by the fixed-width
    # fields in declaration order.
    fmt = '1s' + ''.join('%ds' % size for _, _, size, _ in fields)
    fmtsiz = struct.calcsize(fmt)
    # repeat() counts lazily on Python 2 as well, where range() would build
    # a list with one entry per record.
    for _ in itertools.repeat(None, numrec):
        record = struct.unpack(fmt, f.read(fmtsiz))
        if record[0] != b' ':
            continue  # deleted record
        yield [_dbf_value(typ, deci, raw)
               for (_, typ, _, deci), raw in zip(fields, record[1:])]

def _dbf_bytes(value):
    """Return *value* as the byte string to store in the file.

    Byte strings pass through unchanged; anything else is converted with
    ``str()`` and, where that yields text, encoded as Latin-1 (one byte per
    character, so the width of the value is unchanged).
    """
    if isinstance(value, bytes):
        return value
    if not isinstance(value, type(u'')):
        value = str(value)
        if isinstance(value, bytes):  # Python 2: str() already gives bytes
            return value
    return value.encode('latin-1')


def dbfwriter(f, fieldnames, fieldspecs, records):
    """Write a complete DBF file to f; nothing is returned.

    File f should be open for writing in a binary mode.

    Fieldnames should be no longer than ten characters and not include \\x00.
    Fieldspecs are in the form (type, size, deci) where
        type is one of:
            C for ascii character data
            M for ascii character memo data (real memo fields not supported)
            D for datetime objects (None is written as a blank date)
            N for ints or decimal objects
            L for logical values 'T', 'F', or '?'
        size is the field width
        deci is the number of decimal places in the provided decimal object
    Records can be an iterable over the records (sequences of field values).

    Character and memo values are truncated or space-padded to the field
    width.  An ``AssertionError`` is raised when any other value does not
    come out exactly ``size`` bytes wide, and ``UnicodeEncodeError`` when
    text contains characters outside Latin-1.
    """
    # The record count is stored in the header, which is written first, so
    # a one-shot iterable has to be materialised before anything is written.
    if not hasattr(records, '__len__'):
        records = list(records)

    # header info
    ver = 3
    now = datetime.datetime.now()
    yr, mon, day = now.year - 1900, now.month, now.day
    numrec = len(records)
    numfields = len(fieldspecs)
    lenheader = numfields * 32 + 33
    lenrecord = sum(field[1] for field in fieldspecs) + 1  # +1: deletion flag
    hdr = struct.pack('<BBBBLHH20x', ver, yr, mon, day,
                      numrec, lenheader, lenrecord)
    f.write(hdr)

    # field specs
    for name, (typ, size, deci) in zip(fieldnames, fieldspecs):
        name = _dbf_bytes(name).ljust(11, b'\x00')
        fld = struct.pack('<11sc4xBB14x', name, _dbf_bytes(typ), size, deci)
        f.write(fld)

    # terminator
    f.write(b'\r')

    # records
    columns = [(_dbf_bytes(typ), size) for typ, size, _ in fieldspecs]
    for record in records:
        parts = [b' ']  # deletion flag
        for (typ, size), value in zip(columns, record):
            if typ == b'N':
                value = _dbf_bytes(value).rjust(size, b' ')
            elif typ == b'D':
                if value is None:
                    value = b' ' * size  # blank date
                else:
                    # Formatted by hand: strftime() is not dependable for
                    # early years on every platform/Python version.
                    value = _dbf_bytes('%04d%02d%02d'
                                       % (value.year, value.month, value.day))
            elif typ == b'L':
                value = _dbf_bytes(value)[:1].upper()
            else:
                value = _dbf_bytes(value)[:size].ljust(size, b' ')
            if len(value) != size:
                # Raised explicitly (rather than with ``assert``) so that a
                # misfit value cannot corrupt the file under ``python -O``.
                raise AssertionError('field value %r does not fit width %d'
                                     % (value, size))
            parts.append(value)
        f.write(b''.join(parts))

    # End of file
    f.write(b'\x1A')

# -------------------------------------------------------

# Example calls

if __name__ == '__main__':
    # Demo: read a DBF file, print it, drop a record and a column, write the
    # result to an in-memory DBF, read that back, then dump it as CSV.
    import csv
    import sys
    from io import BytesIO
    from operator import itemgetter

    # The csv module writes byte strings on Python 2 and text on Python 3,
    # so the CSV buffer type has to follow the interpreter.
    try:
        from cStringIO import StringIO
    except ImportError:
        from io import StringIO

    # Read a database
    filename = '/pydev/databases/orders.dbf'
    if len(sys.argv) == 2:
        filename = sys.argv[1]
    with open(filename, 'rb') as f:  # closed even if reading fails
        db = list(dbfreader(f))
    for record in db:
        print(record)
    fieldnames, fieldspecs, records = db[0], db[1], db[2:]

    # Alter the database
    # (the indexes below require at least five records and five fields)
    del records[4]
    records.sort(key=itemgetter(4))

    # Remove a field
    del fieldnames[0]
    del fieldspecs[0]
    records = [rec[1:] for rec in records]

    # Create a new DBF
    f = BytesIO()
    dbfwriter(f, fieldnames, fieldspecs, records)

    # Read the data back from the new DBF
    print('-' * 20)
    f.seek(0)
    for line in dbfreader(f):
        print(line)
    f.close()

    # Convert to CSV
    print('.' * 20)
    f = StringIO()
    csv.writer(f).writerow(fieldnames)
    csv.writer(f).writerows(records)
    print(f.getvalue())
    f.close()

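# Example output of the demo above. It appears to come from a Python 2 run
# (note the Decimal("...") reprs), and the padding inside the quoted strings
# looks collapsed: the specs declare widths of 10 and 11, but the values
# shown are 6 and 4 characters long.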

"""

['ORDER_ID', 'CUSTMR_ID', 'EMPLOY_ID', 'ORDER_DATE', 'ORDER_AMT']

[('C', 10, 0), ('C', 11, 0), ('C', 11, 0), ('D', 8, 0), ('N', 12, 2)]

['10005 ', 'WALNG ', '555 ', datetime.date(1995, 5, 22), Decimal("173.40")]

['10004 ', 'BMARK ', '777 ', datetime.date(1995, 5, 18), Decimal("3194.20")]

['10029 ', 'SAWYH ', '777 ', datetime.date(1995, 6, 29), Decimal("97.30")]

['10013 ', 'RITEB ', '777 ', datetime.date(1995, 6, 2), Decimal("560.40")]

['10024 ', 'RATTC ', '444 ', datetime.date(1995, 6, 21), Decimal("2223.50")]

['10018 ', 'RATTC ', '444 ', datetime.date(1995, 6, 12), Decimal("1076.05")]

['10025 ', 'RATTC ', '444 ', datetime.date(1995, 6, 23), Decimal("185.80")]

['10038 ', 'OLDWO ', '111 ', datetime.date(1995, 7, 14), Decimal("863.96")]

['10002 ', 'MTIME ', '333 ', datetime.date(1995, 5, 16), Decimal("731.80")]

['10007 ', 'MORNS ', '444 ', datetime.date(1995, 5, 24), Decimal("1405.00")]

['10026 ', 'MORNS ', '555 ', datetime.date(1995, 6, 26), Decimal("17.40")]

['10030 ', 'LILLO ', '111 ', datetime.date(1995, 7, 3), Decimal("909.91")]

['10022 ', 'LAPLA ', '111 ', datetime.date(1995, 6, 19), Decimal("671.50")]

['10035 ', 'HIGHG ', '111 ', datetime.date(1995, 7, 11), Decimal("1984.83")]

['10033 ', 'FOODG ', '333 ', datetime.date(1995, 7, 6), Decimal("3401.32")]

--------------------

['CUSTMR_ID', 'EMPLOY_ID', 'ORDER_DATE', 'ORDER_AMT']

[('C', 11, 0), ('C', 11, 0), ('D', 8, 0), ('N', 12, 2)]

['MORNS ', '555 ', datetime.date(1995, 6, 26), Decimal("17.40")]

['SAWYH ', '777 ', datetime.date(1995, 6, 29), Decimal("97.30")]

['WALNG ', '555 ', datetime.date(1995, 5, 22), Decimal("173.40")]

['RATTC ', '444 ', datetime.date(1995, 6, 23), Decimal("185.80")]

['RITEB ', '777 ', datetime.date(1995, 6, 2), Decimal("560.40")]

['LAPLA ', '111 ', datetime.date(1995, 6, 19), Decimal("671.50")]

['MTIME ', '333 ', datetime.date(1995, 5, 16), Decimal("731.80")]

['OLDWO ', '111 ', datetime.date(1995, 7, 14), Decimal("863.96")]

['LILLO ', '111 ', datetime.date(1995, 7, 3), Decimal("909.91")]

['RATTC ', '444 ', datetime.date(1995, 6, 12), Decimal("1076.05")]

['MORNS ', '444 ', datetime.date(1995, 5, 24), Decimal("1405.00")]

['HIGHG ', '111 ', datetime.date(1995, 7, 11), Decimal("1984.83")]

['BMARK ', '777 ', datetime.date(1995, 5, 18), Decimal("3194.20")]

['FOODG ', '333 ', datetime.date(1995, 7, 6), Decimal("3401.32")]

....................

CUSTMR_ID,EMPLOY_ID,ORDER_DATE,ORDER_AMT

MORNS ,555 ,1995-06-26,17.40

SAWYH ,777 ,1995-06-29,97.30

WALNG ,555 ,1995-05-22,173.40

RATTC ,444 ,1995-06-23,185.80

RITEB ,777 ,1995-06-02,560.40

LAPLA ,111 ,1995-06-19,671.50

MTIME ,333 ,1995-05-16,731.80

OLDWO ,111 ,1995-07-14,863.96

LILLO ,111 ,1995-07-03,909.91

RATTC ,444 ,1995-06-12,1076.05

MORNS ,444 ,1995-05-24,1405.00

HIGHG ,111 ,1995-07-11,1984.83

BMARK ,777 ,1995-05-18,3194.20

FOODG ,333 ,1995-07-06,3401.32

"""

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值