163:
#-*- coding: utf-8 -*-
#encoding=utf-8
import MySQLdb
from pyquery import PyQuery
from time import ctime,sleep
import requests
import os
import sys
# Python 2 only: sys.setdefaultencoding is removed from the sys module at
# interpreter start-up, so the module is reloaded to get it back, and the
# process-wide default str/unicode codec is then switched to UTF-8.
# Presumably this is here so the Chinese text scraped below can be mixed
# into byte-string formatting and printed without UnicodeDecodeError.
reload(sys)
sys.setdefaultencoding('utf-8')
def getNews(doc):
    """Store every article listed on the parsed 163.com page.

    Each ``.articleList li`` element of ``doc`` contributes one record: the
    text and ``href`` of its anchor(s), and the text of its ``.postTime``
    child as the publication time. Every record is handed to ``getData``
    together with the fixed source name and source home page.
    """
    source_name = '网易新闻'
    source_url = 'http://www.163.com/'
    for node in doc('.articleList li'):
        # Wrap the raw element once and reuse it for all lookups.
        item = PyQuery(node)
        anchor = item.find('a')
        getData(
            anchor.text(),
            anchor.attr('href'),
            source_name,
            item.children('.postTime').text(),
            source_url,
        )
def getData(title, link, cname, addTime, comeLink):
    """Insert one scraped article into the ``acticle`` table.

    Opens a new MySQL connection, inserts a single row and closes the
    connection again. The insert is best-effort: a database error is rolled
    back and reported on stdout, and the function returns normally so the
    caller can continue with the next article.

    Args:
        title: Article headline.
        link: Article URL.
        cname: Display name of the news source.
        addTime: Publication time as text.
        comeLink: Home page URL of the news source.
    """
    # NOTE(review): connection settings are hard-coded for a local database;
    # consider loading them from configuration instead of source code.
    db = MySQLdb.connect(host="localhost", port=3306, user="root",
                         passwd="123456", db="app_chelseafc", charset="utf8")
    # The values come from scraped web pages, so they are bound by the driver
    # rather than interpolated into the statement: quotes inside a title can
    # no longer break the statement or inject SQL.
    sql = ('insert into acticle (title,link,cname,addTime,comeLink) '
           'values(%s,%s,%s,%s,%s)')
    params = (title, link, cname, addTime, comeLink)
    try:
        cursor = db.cursor()
        # Trace output only; the statement actually sent to the server is
        # assembled (and escaped) by the driver from sql + params.
        print(sql % params)
        try:
            cursor.execute(sql, params)
            db.commit()
            print("success")
        except MySQLdb.Error as err:
            db.rollback()
            print("insert failed: %s" % err)
    finally:
        # Release the connection even if an unexpected error propagates.
        db.close()
if __name__ == '__main__':
    # Download the 163.com listing page, parse it and store every article
    # found on it.
    # The timeout keeps the script from blocking forever when the server
    # accepts the connection but never answers.
    r = requests.get("http://sports.163.com/special/y/00051F15/ycqexmore.html",
                     timeout=30)
    # NOTE(review): r.text is decoded with whatever encoding requests picks
    # for the response; if titles come out garbled, set r.encoding
    # explicitly -- TODO confirm the page's charset.
    html = r.text
    doc = PyQuery(html)
    getNews(doc)
qq:
#-*- coding: utf-8 -*-
#encoding=utf-8
import MySQLdb
from pyquery import PyQuery
from time import ctime,sleep
import requests
import os
import sys
# Python 2 only: sys.setdefaultencoding is removed from the sys module at
# interpreter start-up, so the module is reloaded to get it back, and the
# process-wide default str/unicode codec is then switched to UTF-8.
# Presumably this is here so the Chinese text scraped below can be mixed
# into byte-string formatting and printed without UnicodeDecodeError.
reload(sys)
sys.setdefaultencoding('utf-8')
def getNews(doc):
    """Store every article listed on the parsed qq.com page.

    Each ``.newslist li`` element of ``doc`` contributes one record: the text
    and ``href`` of its anchor(s). The listing's own timestamp is not read;
    the current local time (``ctime()``) at the moment the item is processed
    is recorded instead. Every record is handed to ``getData`` together with
    the fixed source name and source home page.
    """
    source_name = '腾讯新闻'
    source_url = 'http://www.qq.com/'
    for node in doc('.newslist li'):
        anchor = PyQuery(node).find('a')
        headline = anchor.text()
        href = anchor.attr('href')
        # Sampled per item, after the anchor has been read.
        seen_at = ctime()
        getData(headline, href, source_name, seen_at, source_url)
def getData(title, link, cname, addTime, comeLink):
    """Insert one scraped article into the ``acticle`` table.

    Opens a new MySQL connection, inserts a single row and closes the
    connection again. The insert is best-effort: a database error is rolled
    back and reported on stdout, and the function returns normally so the
    caller can continue with the next article.

    Args:
        title: Article headline.
        link: Article URL.
        cname: Display name of the news source.
        addTime: Publication time as text.
        comeLink: Home page URL of the news source.
    """
    # NOTE(review): connection settings are hard-coded for a local database;
    # consider loading them from configuration instead of source code.
    db = MySQLdb.connect(host="localhost", port=3306, user="root",
                         passwd="123456", db="app_chelseafc", charset="utf8")
    # The values come from scraped web pages, so they are bound by the driver
    # rather than interpolated into the statement: quotes inside a title can
    # no longer break the statement or inject SQL.
    sql = ('insert into acticle (title,link,cname,addTime,comeLink) '
           'values(%s,%s,%s,%s,%s)')
    params = (title, link, cname, addTime, comeLink)
    try:
        cursor = db.cursor()
        # Trace output only; the statement actually sent to the server is
        # assembled (and escaped) by the driver from sql + params.
        print(sql % params)
        try:
            cursor.execute(sql, params)
            db.commit()
            print("success")
        except MySQLdb.Error as err:
            db.rollback()
            print("insert failed: %s" % err)
    finally:
        # Release the connection even if an unexpected error propagates.
        db.close()
if __name__ == '__main__':
    # Download the qq.com listing page, parse it and store every article
    # found on it.
    # The timeout keeps the script from blocking forever when the server
    # accepts the connection but never answers.
    r = requests.get("http://sports.qq.com/l/isocce/yingc/chelse/che.htm",
                     timeout=30)
    # NOTE(review): r.text is decoded with whatever encoding requests picks
    # for the response; if titles come out garbled, set r.encoding
    # explicitly -- TODO confirm the page's charset.
    html = r.text
    doc = PyQuery(html)
    getNews(doc)
sina:
#-*- coding: utf-8 -*-
#encoding=utf-8
import MySQLdb
from pyquery import PyQuery
from time import ctime,sleep
import requests
import os
import sys
# Python 2 only: sys.setdefaultencoding is removed from the sys module at
# interpreter start-up, so the module is reloaded to get it back, and the
# process-wide default str/unicode codec is then switched to UTF-8.
# Presumably this is here so the Chinese text scraped below can be mixed
# into byte-string formatting and printed without UnicodeDecodeError.
reload(sys)
sys.setdefaultencoding('utf-8')
def getNews(doc):
    """Store every article listed on the parsed sina.com.cn page.

    Each ``.d_list_txt li`` element of ``doc`` contributes one record: the
    text and ``href`` of its anchor(s), and the text of its ``.c_time`` child
    as the publication time. Every record is handed to ``getData`` together
    with the fixed source name and source home page.
    """
    source_name = '新浪新闻'
    source_url = 'http://www.sina.com.cn/'
    for node in doc('.d_list_txt li'):
        # Wrap the raw element once and reuse it for all lookups.
        item = PyQuery(node)
        anchor = item.find('a')
        getData(
            anchor.text(),
            anchor.attr('href'),
            source_name,
            item.children('.c_time').text(),
            source_url,
        )
def getData(title, link, cname, addTime, comeLink):
    """Insert one scraped article into the ``acticle`` table.

    Opens a new MySQL connection, inserts a single row and closes the
    connection again. The insert is best-effort: a database error is rolled
    back and reported on stdout, and the function returns normally so the
    caller can continue with the next article.

    Args:
        title: Article headline.
        link: Article URL.
        cname: Display name of the news source.
        addTime: Publication time as text.
        comeLink: Home page URL of the news source.
    """
    # NOTE(review): connection settings are hard-coded for a local database;
    # consider loading them from configuration instead of source code.
    db = MySQLdb.connect(host="localhost", port=3306, user="root",
                         passwd="123456", db="app_chelseafc", charset="utf8")
    # The values come from scraped web pages, so they are bound by the driver
    # rather than interpolated into the statement: quotes inside a title can
    # no longer break the statement or inject SQL.
    sql = ('insert into acticle (title,link,cname,addTime,comeLink) '
           'values(%s,%s,%s,%s,%s)')
    params = (title, link, cname, addTime, comeLink)
    try:
        cursor = db.cursor()
        # Trace output only; the statement actually sent to the server is
        # assembled (and escaped) by the driver from sql + params.
        print(sql % params)
        try:
            cursor.execute(sql, params)
            db.commit()
            print("success")
        except MySQLdb.Error as err:
            db.rollback()
            print("insert failed: %s" % err)
    finally:
        # Release the connection even if an unexpected error propagates.
        db.close()
if __name__ == '__main__':
    # Download the sina.com.cn listing page, parse it and store every
    # article found on it.
    # The timeout keeps the script from blocking forever when the server
    # accepts the connection but never answers.
    r = requests.get("http://roll.sports.sina.com.cn/s_premierleague_all/3/index.shtml",
                     timeout=30)
    # Force gb2312 decoding of the body instead of the encoding requests
    # would pick on its own (presumably the page is served in that charset
    # without declaring it in the HTTP headers -- verify).
    r.encoding ='gb2312'
    html = r.text
    doc = PyQuery(html)
    getNews(doc)