这本书由刘宇宙编写,我看了一个星期Python,收获还是很大的,下一步准备学习一下Python Web。Python和Java有很多不一样的地方,Python站在巨人的肩膀上,让语言变得更简单了。说实话我更喜欢Java,它更具逻辑性,更难,也就更有挑战性。我感觉在Python的语法中能看到PHP、JS、Go的用法,所以看着还是很亲切的。
一、文件改名
这个并不是这本书里面的,只是用python实现更简单
#! /usr/bin/python3
# -*-coding:UTF-8-*-
import os
# Directory whose files get renamed; the trailing slash lets file names be
# appended to it directly.
dirCMD = 'E:/xwcode/platformWeb/img/bg/'
# Number of files renamed so far; it selects which slice of the name is kept.
count = 0
# os.listdir() returns names in arbitrary order, but the slicing below relies
# on `count` growing in step with the order the files are visited, so the
# names are sorted to make that order deterministic.
movie_name = sorted(os.listdir(dirCMD))
for temp in movie_name:
    # Only files whose name contains '首页' are renamed.
    if "首页" in temp:
        oldName = dirCMD + temp
        # Remove the '首页30' marker, then drop leading characters from what
        # is left: two for the first ten files, one for the next ninety, and
        # none afterwards (presumably stripping zero padding -- confirm
        # against the real file names).
        temp2 = temp.replace('首页30', '')
        if count <= 9:
            newName = dirCMD + temp2[2:7]
        elif count <= 99:
            newName = dirCMD + temp2[1:7]
        else:
            newName = dirCMD + temp2
        print(newName)
        os.renames(oldName, newName)
        count += 1
二、网络编程的TCP
网络编程这一章有TCP,还有UDP。下面是TCP的服务端和客户端,没有写UDP的例子,两者只是协议不一样。
#! /usr/bin/python3
# -*-coding:UTF-8-*-
import socket
import threading
def socket_server(host=None, port=9999):
    """Accept TCP clients forever, serving each one on its own thread.

    Args:
        host: Host name or address to bind to. When None, the local host
            name returned by ``socket.gethostname()`` is used.
        port: TCP port to listen on.

    Every accepted connection is handed to ``tcp_link`` in a new thread,
    because a single thread that is busy with one client cannot accept
    another. The function only ends when an exception is raised.
    """
    if host is None:
        host = socket.gethostname()
    # AF_INET selects IPv4 and SOCK_STREAM selects stream-oriented TCP.
    # The with-block closes the listening socket if the loop is interrupted.
    with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as server_socket:
        server_socket.bind((host, port))
        # Allow up to 5 pending connections to queue before being accepted.
        server_socket.listen(5)
        while True:
            # Block until the next client connects.
            sock, addr = server_socket.accept()
            t = threading.Thread(target=tcp_link, args=(sock, addr))
            t.start()
def tcp_link(sock, addr):
    """Serve one connected client until it disconnects or sends 'exit'.

    Sends a welcome message, then answers every received chunk with
    ``'Hello,<chunk>'``. The reply to ``'exit'`` is still sent before the
    loop ends. An empty read means the peer closed the connection, so
    nothing is sent back in that case.

    Args:
        sock: Connected socket for this client. It is always closed before
            the function returns or raises.
        addr: Two-item address (host, port) of the client; it fills both
            ``%s`` placeholders of the log line.
    """
    print('new connection form %s:%s....' % addr)
    try:
        sock.sendall('welcome to python'.encode('utf-8'))
        while True:
            # Read at most 1024 bytes per call.
            data = sock.recv(1024).decode('utf-8')
            if not data:
                # Peer closed its side; replying would write to a dead link.
                break
            sock.sendall(('Hello,%s' % data).encode('utf-8'))
            if data == 'exit':
                break
    finally:
        sock.close()
    print('connect close')
def main():
    """Script entry point: start the TCP server."""
    socket_server()


# __name__ holds the name under which this module is being executed: it is
# '__main__' when the file is run directly, otherwise the module's own name.
if __name__ == '__main__':
    main()
#! /usr/bin/python3
# -*-coding:UTF-8-*-
import socket
def socket_client(host=None, port=9999):
    """Connect to the TCP server, send three test messages, then 'exit'.

    Args:
        host: Server host name or address. When None, the local host name
            returned by ``socket.gethostname()`` is used.
        port: TCP port the server listens on.

    The greeting and the reply to each test message are printed. The reply
    to the final 'exit' message is not read. The socket is closed when the
    function returns or raises.
    """
    if host is None:
        host = socket.gethostname()
    with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as client_socket:
        client_socket.connect((host, port))
        # The server greets first, so read that before sending anything.
        print(client_socket.recv(1024).decode('utf-8'))
        for data in ['12', '14', '15']:
            client_socket.send(data.encode('utf-8'))
            print(client_socket.recv(1024).decode('utf-8'))
        client_socket.send(b'exit')
def main():
    """Script entry point: run the TCP client once."""
    socket_client()


# Only start the client when this file is executed directly.
if __name__ == '__main__':
    main()
三、网络爬虫、获取豆瓣电影
#! /usr/bin/python3
# -*-coding:UTF-8-*-
from urllib import request
import re
class MovieTop(object):
    """Scrape the Douban Top 250 movie list and save it to a text file.

    Pages are fetched 25 entries at a time, parsed with a regular
    expression into 11-field records, collected in ``movie_list`` and
    finally written to ``file_path``.
    """

    # Captures the 11 fields of one movie entry, in the order used by
    # get_movie_info() and write_text(). re.S lets '.' span line breaks.
    # NOTE(review): the literal spaces in this pattern and in the
    # lstrip(' / ') calls may originally have been HTML entities such as
    # &nbsp; -- confirm against the live page markup.
    _MOVIE_PATTERN = re.compile(
        u'<div.*?class="item">.*?'
        u'<div.*?class="pic">.*?'
        u'<em.*?class="">(.*?)</em>.*?'
        u'<div.*?class="info">.*?'
        u'<span.*?class="title">(.*?)'
        u'</span>.*?<span.*?class="title">(.*?)</span>.*?'
        u'<span.*?class="other">(.*?)</span>.*?</a>.*?'
        u'<div.*?class="bd">.*?<p.*?class="">.*?'
        u'导演: (.*?) .*?<br>'
        u'(.*?) / (.*?) / '
        u'(.*?)</p>.*?<div.*?class="star">.*?'
        u'<span.*?'
        u'class="rating_num".*?property="v:average">'
        u'(.*?)</span>.*?'
        u'.*?<span>(.*?)人评价</span>.*?'
        u'<p.*?class="quote">.*?'
        u'<span.*?class="inq">(.*?)'
        u'</span>.*?</p>',
        re.S)

    # Output label for each of the 11 record fields, in record order.
    _FIELD_LABELS = (
        '电影排名:',
        '电影名称:',
        '外文名称:',
        '电影别名:',
        '导演姓名:',
        '上映年份:',
        '制作国家/地区:',
        '电影类别:',
        '电影评分:',
        '参评人数:',
        '简短影评:',
    )

    def __init__(self):
        # Offset of the first entry of the next page to fetch.
        self.start = 0
        # Not referenced by any method of this class.
        self.param = '&filter='
        self.headers = {
            'User-Agent': 'Mozilla/5.0(Windows NT 6.1;WOW64)'
        }
        # One 11-item list of strings per scraped movie.
        self.movie_list = []
        # Raw string: '\m' is not a valid escape sequence in a normal literal.
        self.file_path = r'D:\movie.txt'

    def get_page(self):
        """Fetch the page starting at ``self.start`` and advance the offset.

        Returns:
            The page HTML decoded as UTF-8, or None when the request raised
            ``URLError``. In that case the reason is printed and
            ``self.start`` is left unchanged.
        """
        try:
            url = 'https://movie.douban.com/top250?start=' + str(self.start)
            req = request.Request(url, headers=self.headers)
            # The with-block closes the HTTP response once it has been read.
            with request.urlopen(req) as response:
                page = response.read().decode('utf-8')
            page_num = (self.start + 25) // 25
            print(page_num)
            self.start += 25
            return page
        except request.URLError as e:
            if hasattr(e, 'reason'):
                print(e.reason)
            return None

    def get_movie_info(self):
        """Fetch every remaining page and append its movies to movie_list.

        Loops while ``self.start`` is at most 225. Stops early when a page
        cannot be fetched: get_page() does not advance the offset on
        failure, so retrying here would never terminate.
        """
        while self.start <= 225:
            page = self.get_page()
            if page is None:
                break
            for movie in self._MOVIE_PATTERN.findall(page):
                self.movie_list.append(
                    [movie[0],
                     movie[1],
                     movie[2].lstrip(' / '),
                     movie[3].lstrip(' / '),
                     movie[4],
                     movie[5].lstrip(),
                     movie[6],
                     movie[7].rstrip(),
                     movie[8],
                     movie[9],
                     movie[10]]
                )

    def write_text(self):
        """Write all records in movie_list to file_path as UTF-8 text.

        Each field is written as ``<label><value>`` terminated by CRLF, and
        each record is followed by one extra CRLF. Errors raised while
        writing are printed rather than propagated.
        """
        print('开始向文件写入数据.........')
        # newline='' writes the explicit '\r\n' terminators unchanged; the
        # default text mode would turn them into '\r\r\n' on Windows.
        with open(self.file_path, 'w', encoding='utf-8',
                  newline='') as file_top:
            try:
                for movie in self.movie_list:
                    lines = [label + value for label, value
                             in zip(self._FIELD_LABELS, movie)]
                    file_top.write('\r\n'.join(lines) + '\r\n\r\n')
                print('抓取结果写入文件成功...')
            except Exception as e:
                print(e)

    def main(self):
        """Run the whole job: scrape all pages, then write the output file."""
        print('开始从豆瓣电影抓取数据........')
        self.get_movie_info()
        self.write_text()
        print('数据抓取完毕...')
# Only start the crawl when this file is executed directly, so importing the
# module does not trigger network requests or file writes.
if __name__ == '__main__':
    dou_ban_spider = MovieTop()
    dou_ban_spider.main()
四、数据库连接
需要pip install pymysql
#! /usr/bin/python3
# -*-coding:UTF-8-*-
import pymysql
def connect(host='localhost', user='root', password='root', database='nm3'):
    """Connect to a MySQL server and print its version.

    Args:
        host: Server host name.
        user: Login user name.
        password: Login password.
        database: Database to select after connecting.

    The connection is closed before the function returns, including when
    the query raises.
    """
    # Keyword arguments are used because PyMySQL 1.0 and later no longer
    # accept positional connection parameters.
    db = pymysql.connect(host=host, user=user, password=password,
                         database=database)
    try:
        with db.cursor() as cursor:
            cursor.execute("SELECT VERSION()")
            data = cursor.fetchone()
        print("DataBase Version: %s" % data)
    finally:
        db.close()
def main():
    """Script entry point: run the database connection check."""
    connect()


# Only run the check when this file is executed directly.
if __name__ == '__main__':
    main()