新浪爬虫 java_用java实现新浪爬虫,代码完整剖析(仅针对当前SinaSignOn有效)

1 packagemain.java.sina.httpclient;2 importjava.util.HashMap;3 importjava.util.List;4 importjava.util.Map;5

6 importorg.apache.http.HttpResponse;7 importorg.apache.http.cookie.Cookie;8

9 importmain.java.sina.utils.Constant;10 importmain.java.sina.utils.EncodeUtils;11 importmain.java.sina.utils.HttpUtils;12 importmain.java.sina.utils.Utils;13

14 public classSpiderSina {15 privateLoginSina ls;16 private Mapheaders;17 private final int ADDFOLLOWING =1;18 private final int CANCELFOLLOWING =2;19 publicSpiderSina(LoginSina ls){20 this.ls=ls;21 this.headers=new HashMap();22 headers.put("Accept", "text/html, application/xhtml+xml, */*");23 headers.put("Accept-Language", "zh-cn");24 headers.put("User-Agent", "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0; BOIE9;ZHCN");25 headers.put("Connection", "Keep-Alive");26 headers.put("Cache-Control", "no-cache");27 String cookieValue=HttpUtils.setCookie2String(ls.getCookies());28 headers.put("Cookie", cookieValue);29 }

36 publicString getGroupCategory(){37 String url="http://q.weibo.com/";38 this.headers.put("Host", "q.weibo.com");39 HttpResponse response=HttpUtils.doGet(url, headers);40 String responseText=HttpUtils.getStringFromResponse(response);41 responseText=EncodeUtils.unicdoeToGB2312(responseText);42 returnresponseText;43 }44 public String search(String keyword, intpageNo){

47 String url="http://s.weibo.com/weibo/%25E5%25AE%2581%25E6%25B3%25A2%25E5%25A4%25A7%25E5%25AD%25A6&page="+pageNo;48 String cookieValue = "SINAGLOBAL=8556698272004.724.1417744632425; un=shy_annan@126.com; myuid=5439352084; wvr=6; un=sm2014121904@126.com; _s_tentry=developer.51cto.com; SWB=usrmdinst_14; SUS=SID-5438576807-1419173757-GZ-lrze7-d8e1e3f082b428c12412c8ba30f0a6de; SUE=es%3D4cdfdd5d5f0f75141c092b32f89525a2%26ev%3Dv1%26es2%3D469e50c869315e57efeec3012c3bb6a8%26rs0%3DoWdG36CQ33LUEtKTvGn907Zy1mwFETvSVJsxeHEiaMPcKDB7pFxg596a2pLhFLJfQmswf4AvXYAkzTfemrYgWrz%252BQPustEA2wLNYufYpAZqFsGWanhTBq6elzB2yoZp41xcpy1WwXn1CuvzIzzEYpuILjHahkmJDQDQy6KaxlbA%253D%26rv%3D0; SUP=cv%3D1%26bt%3D1419173757%26et%3D1419260157%26d%3Dc909%26i%3Da6de%26us%3D1%26vf%3D0%26vt%3D0%26ac%3D27%26st%3D0%26uid%3D5438576807%26name%3Dsm2014121904%2540126.com%26nick%3DSocialMedia%25E5%259B%259B%25E5%25A8%2583%26fmp%3D%26lcp%3D; SUB=_2A255kq8tDeTxGeNK6FoU9yjEyzuIHXVa6DVlrDV8PUNbvtBeLW3TkW-bMoi0G_bBfpbS3TMqcXg6zDWFLA..; SUBP=0033WrSXqPxfM725Ws9jqgMF55529P9D9WhGThsH46uNrx1VY0ApV0SR5JpX5KMt; ALF=1450709756; SSOLoginState=1419173757; WBStore=bc5ad8450c3f8a48|undefined; Apache=1027467835228.8901.1419173761694; ULV=1419173761704:6:6:1:1027467835228.8901.1419173761694:1418797827169; UOR=www.ilehao.com,widget.weibo.com,login.sina.com.cn; ULOGIN_IMG=14192385783486";49 headers.put("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8");50 //headers.put("Accept-Encoding", "gzip, deflate, sdch");

51 headers.put("Accept-Language", "zh-CN");52 headers.put("User-Agent", "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.71 Safari/537.36");53 headers.put("Connection", "Keep-Alive");54 headers.put("Cache-Control", "max-age=0");55 headers.put("Referer", "http://login.sina.com.cn/sso/login.php?url=http%3A%2F%2Fs.weibo.com%2Fweibo%2F%2525E6%252583%2525A0%2525E6%252599%2525AE%26page%3D2&_rand=1419173756.6387&gateway=1&service=weibo&entry=miniblog&useticket=1&returntype=META");56 headers.put("Cookie", cookieValue);57 this.headers.put("Host", "s.weibo.com");58 HttpResponse response=HttpUtils.doGet(url, headers);59 String responseText=HttpUtils.getStringFromResponse(response);60 responseText=EncodeUtils.unicdoeToGB2312(responseText);61

62

63 returnresponseText;64 }65

66 publicString searchCommentsByUid(String uid){67

68 String url="http://www.weibo.com/u/"+uid;69 String cookieValue = "SINAGLOBAL=8556698272004.724.1417744632425; myuid=2035860051; wvr=6; YF-Ugrow-G0=ad06784f6deda07eea88e095402e4243; SSOLoginState=1423150079; YF-V5-G0=32eb5467e9bfc8b60c2d771056535ac5; _s_tentry=www.weibo.com; Apache=6264929557219.147.1423150103832; ULV=1423150103842:18:2:2:6264929557219.147.1423150103832:1422769721265; ULOGIN_IMG=1423233797946; YF-Page-G0=82cdcdfb16327a659fbb60cc9368fb19; SUS=SID-2035860051-1423286223-GZ-jdkh4-c8ea11de0a42151313986e52f9aa6017; SUE=es%3D8701ff5aca59244ff1ff263cf985bee6%26ev%3Dv1%26es2%3D7995c9eb7455697c09fac4f7486e14eb%26rs0%3DTyXXIRjcEw%252BeS5PaVSM%252FhQjc2JGhKBOe3uFTgShiIUAbPFI2eKtrgxM2wIi9A1xndiTFFM72zY%252FDKYFXONrgkao5cRo%252FHkydV%252FnaQjNmXoeESu5gi6Iq0aX883NhGR0utBVNZb5XaIG3X6HMMfBJC%252B7pnVHogEo8eD6cx8nzN5c%253D%26rv%3D0; SUP=cv%3D1%26bt%3D1423286223%26et%3D1423372623%26d%3Dc909%26i%3D6017%26us%3D1%26vf%3D0%26vt%3D0%26ac%3D0%26st%3D0%26uid%3D2035860051%26name%3Dshy_annan%2540126.com%26nick%3D%25E7%2594%25A8%25E6%2588%25B72035860051%26fmp%3D%26lcp%3D2013-08-18%252021%253A48%253A10; SUB=_2A2550e-fDeTxGeRO6FcZ9i7Mzj2IHXVap0ZXrDV8PUNbvtBuLWnTkW-gBGVORTA7J_lSZzAqzW6E50JjBQ..; SUBP=0033WrSXqPxfM725Ws9jqgMF55529P9D9Wh7oKNCGYcNnhlC6eqqQbbl5JpX5KMt; SUHB=0M20OGRPiOKzyc; ALF=1454822222; UOR=www.ilehao.com,widget.weibo.com,login.sina.com.cn";70 headers.put("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8");71 headers.put("Accept-Language", "zh-CN");72 headers.put("User-Agent", "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.71 Safari/537.36");73 headers.put("Connection", "Keep-Alive");74 headers.put("Cache-Control", "max-age=0");75 headers.put("Cookie", cookieValue);76 this.headers.put("Host", "www.weibo.com");77 HttpResponse response=HttpUtils.doGet(url, headers);78 String responseText=HttpUtils.getStringFromResponse(response);79 responseText=EncodeUtils.unicdoeToGB2312(responseText);

82 returnresponseText;83 }

85 //爬虫根据关键字,查询时间断,和查询页数 来得到htmlContent

86 public String search(String keyword, intpageNo, String fromdate,String todate){87 StringBuffer stringBuffer = new StringBuffer(200);

93 stringBuffer.append("http://s.weibo.com/weibo/"+ keyword +"&page=");94 stringBuffer.append(pageNo);95 stringBuffer.append("&typeall=1&suball=1&timescope=custom:");96 stringBuffer.append(fromdate);97 stringBuffer.append(":");98 stringBuffer.append(todate);99 stringBuffer.append("&Refer=g");

104 String url =stringBuffer.toString();105 String cookieValue = headers.get("Cookie");

106 headers.put("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8");107 //headers.put("Accept-Encoding", "gzip, deflate, sdch");

108 headers.put("Accept-Language", "zh-CN");109 headers.put("User-Agent", "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.71 Safari/537.36");110 headers.put("Connection", "Keep-Alive");111 headers.put("Cache-Control", "max-age=0");112 headers.put("Referer", "http://s.weibo.com/weibo/%25E5%25AE%2581%25E6%25B3%25A2%25E5%25A4%25A7%25E5%25AD%25A6&typeall=1&suball=1&timescope=custom:"+fromdate+":"+todate+"&Refer=g");113 headers.put("Cookie", cookieValue);114 this.headers.put("Host", "s.weibo.com");115 HttpResponse response=HttpUtils.doGet(url, headers);116 String responseText=HttpUtils.getStringFromResponse(response);117 responseText=EncodeUtils.unicdoeToGB2312(responseText);118

119 System.out.println("************htmlContent start***********");120 System.out.println(responseText);121 System.out.println("************htmlContent end***********");

125 returnresponseText;

127 }

129 public voidforwardToWeiboPage(){130 String url =Constant.personalHomePage;131 headers.put("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8");

133 headers.put("Accept-Language", "zh-CN");134 headers.put("User-Agent", "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/39.0.2171.71 Safari/537.36");135 headers.put("Connection", "Keep-Alive");

137 this.headers.put("Host", "s.weibo.com");138 HttpResponse response=HttpUtils.doGet(url, headers);139 String responseText=HttpUtils.getStringFromResponse(response);140 responseText=EncodeUtils.unicdoeToGB2312(responseText);141 List cookies =HttpUtils.getResponseCookies(response);142 String cookie =HttpUtils.setCookie2String(cookies);

144 headers.put("Cookie", cookie);

146 }

150 public String getGroupCategory(intid){151 String url="http://q.weibo.com/class/category/?id="+id;152 this.headers.put("Host", "q.weibo.com");

154 HttpResponse response=HttpUtils.doGet(url, headers);155 String responseText=HttpUtils.getStringFromResponse(response);156 responseText=EncodeUtils.unicdoeToGB2312(responseText);157 returnresponseText;158 }

169 //得到微群管理员ID信息,其实用户成员的第一页 HTML页面

170 publicString getGroupAdministrator(String groupid) {171 String url="http://q.weibo.com/"+groupid+"/members/all";172 this.headers.remove("Referer");173 this.headers.put("Host", "q.weibo.com");174 this.headers.remove("Content-Type");175 this.headers.remove("x-requested-with");176 HttpResponse response=HttpUtils.doGet(url, headers);177 String responseText=HttpUtils.getStringFromResponse(response);178 returnresponseText;179 }180 //根据微群号和页号得到群成员ID信息 -----JSON格式数据

181 public String getGroupMembers(String groupid,intpagenumber){182 this.headers.put("Referer", "http://q.weibo.com/"+groupid+"/members/all");183 this.headers.put("Host", "q.weibo.com");184 this.headers.put("Content-Type", "application/x-www-form-urlencoded");185 this.headers.put("x-requested-with", "XMLHttpRequest");

187 Map params=new HashMap();188 params.put("_t", "0");189 params.put("page", pagenumber+"");190 params.put("gid", groupid);191 params.put("query","");192 params.put("tab", "all");193 params.put("vip", "1");194 String url="http://q.weibo.com/ajax/members/page";195 HttpResponse response=HttpUtils.doPost(url, headers, params);196 returnHttpUtils.getStringFromResponse(response);197 }198 /*

199 * 得到微群中微博信息 经过多次尝试成功200 * 每次获得50个微博记录,page是页号, count值50 可以在1-75之间,但是,每次开始的时候还是从50的倍数开始的201 */

202 public String getGroupTopic(int page,intcount,String gid){203 this.headers.put("Referer", "http://q.weibo.com/"+gid);204 this.headers.put("Host", "q.weibo.com");205 this.headers.put("Content-Type", "application/x-www-form-urlencoded");206 this.headers.put("x-requested-with", "XMLHttpRequest");207 Integer pre_page=1;208 if(page==1){209 pre_page=2;210 }else{211 pre_page=page-1;212 }213 Map params=new HashMap();214 params.put("_k", System.currentTimeMillis()+"");215 params.put("_t", "0");216 params.put("count", count+"");217 //params.put("end_id", end_id);

218 params.put("gid", gid);219 params.put("is_search","");220 params.put("key_word", "");221 params.put("me", "0");222 params.put("mids", "");223 params.put("new", "0");224 params.put("page", page+"");225 params.put("pagebar", "0");

226 params.put("pre_page", pre_page+"");227 params.put("since_id", "0");228 params.put("uid", "0");229

230 String url="http://q.weibo.com/ajax/mblog/groupfeed";231 HttpResponse response=HttpUtils.doPost(url, headers, params);232 returnHttpUtils.getStringFromResponse(response);233 }234 /*

235 * 得到微群中微博信息数目236 * 这个信息中其实还包含了微群的所有的基本信息~~~~~~~~~~****** json格式的数据信息237 */

238 publicString getGroupMessageNumber(String gid){239 this.headers.put("Referer", "http://q.weibo.com/"+gid);240 this.headers.put("Host", "q.weibo.com");241 this.headers.put("Content-Type", "application/x-www-form-urlencoded");242 this.headers.put("x-requested-with", "XMLHttpRequest");243 String url="http://q.weibo.com/ajax/rightnav/groupprofile?gid="+gid+"&_t=0&__rnd="+System.currentTimeMillis();244 HttpResponse response=HttpUtils.doGet(url, headers);245 returnHttpUtils.getStringFromResponse(response);246 }247 //得到微群的主页信息 HTML页码 主要是为了得到第一条微博记录的MID值

248 publicString getgroupMainPage(String groupid) {249 String url="http://q.weibo.com/"+groupid+"?topnav=1";250 this.headers.remove("Referer");251 this.headers.put("Host", "q.weibo.com");252 this.headers.remove("Content-Type");253 this.headers.remove("x-requested-with");254

255 HttpResponse response=HttpUtils.doGet(url, headers);256 String responseText=HttpUtils.getStringFromResponse(response);257 returnresponseText;258 }259 /*

260 * 根据分类得到微群信息261 * categroyID :分类ID号262 * pagenumber:页号263 * sort:分类方式 1 按成员人数 2按 微群博数 3按创建时间分类264 * count:每页的记录数目265 */

266 public String getGroupByCategroy(int categroyID,int pagenumber,int sort,intcount){267 this.headers.put("Referer", "http://q.weibo.com/class/category/?id="+categroyID);268 this.headers.put("Host", "q.weibo.com");269 this.headers.put("Content-Type", "application/x-www-form-urlencoded");270 this.headers.put("x-requested-with", "XMLHttpRequest");271 Map params=new HashMap();272 params.put("_t", "0");273 params.put("page", pagenumber+"");274 params.put("id", categroyID+"");275 params.put("sort",sort+"");276 params.put("count", count+"");277

278 String url="http://q.weibo.com/ajax/class/category";279 HttpResponse response=HttpUtils.doPost(url, headers,params);280 String responseText=HttpUtils.getStringFromResponse(response);281 responseText=EncodeUtils.unicdoeToGB2312(responseText);282 returnresponseText;283 }284 //得到表情列表信息

285 publicString getFaceList(){286 String url="http://weibo.com/aj/mblog/face?type=face&_t=0&__rnd="+System.currentTimeMillis();287 this.headers.put("Referer", "http://weibo.com/");288 this.headers.put("Host", "weibo.com");289 this.headers.put("Content-Type", "application/x-www-form-urlencoded");290 this.headers.put("x-requested-with", "XMLHttpRequest");291

292 HttpResponse response=HttpUtils.doGet(url, headers);293 String responseText=HttpUtils.getStringFromResponse(response);294 System.out.println(responseText);295 Utils.writeFileFromString("tmpFile/faceList.txt", responseText);296 returnresponseText;297 }

307 //用户基本信息 主要是将要解析用户主页下方经过编码后的内容

308 publicString getMemberInfo(String memberID){309 String url="http://weibo.com/"+memberID+"/info";310 this.headers.put("Host", "weibo.com");311 this.headers.put("Referer", "http://weibo.com/u/"+memberID);312 HttpResponse response=HttpUtils.doGet(url, headers);313 String responseText=HttpUtils.getStringFromResponse(response);314 returnresponseText;315 }316 //用户粉丝用户信息 html页面,每次20个

317 public String getMemberFans(String memberID,intpage){318 String url="http://weibo.com/"+memberID+"/fans?&uid=1689219395&tag=&page="+page;319 this.headers.put("Host", "weibo.com");320 this.headers.put("Referer", "http://weibo.com/"+memberID+"/fans");321 HttpResponse response=HttpUtils.doGet(url, headers);322 String responseText=HttpUtils.getStringFromResponse(response);323 returnresponseText;324 }325 //用户关注的用户信息 html页面

326 public String getMemberFollowing(String memberID,intpage){327 String url="http://weibo.com/"+memberID+"/follow?page="+page;328 this.headers.put("Host", "weibo.com");329 this.headers.put("Referer", "http://weibo.com/"+memberID+"/follow");330 HttpResponse response=HttpUtils.doGet(url, headers);331 String responseText=HttpUtils.getStringFromResponse(response);332 returnresponseText;333 }334

335 /*

336 * @params337 * memberID:是用户ID338 * max_id:每次AJAX获得数据时上面一次的最后一个ID值339 * end_id:用户最新的一条微博的ID值340 * k:一个随机数341 * page:页号342 * pre_page:前一页343 * count:每次返回的数值 当max_id为null是 count=50 否则为15344 * pagebar:ajax时,第一次为0,第二次为1345 * 注意:346 * 1 用此请求,每次获得的数据格式都一样,用同样的解析方法来进行解析。347 * 2 每次一页可以获得总共45条记录,需要三次请求。每次请求可获得15条记录。348 * 3 max_id可以不用到,直接等于 end_id就可以了.349 * 4 第一次请求时可以将end_id设置为NUll,即为第一次时翻页时的请求后边的滚动时必须有end_id参数,end_id为第一页的第一条ID即可。350 */

351 //获得用户发布的微博信息 json格式的数据

352 publicString getMemberReleaseTopic(String memberID,String end_id,Integer page,Integer pagebar){353 String url="";354 Integer pre_page=1;355 Integer count=0;356 String k=System.currentTimeMillis()+""+(int)(Math.random()*100000)%100;357 if(end_id==null){358 count=50;359 if(page==1){360 pre_page=2;361 }else{362 pre_page=page-1;363 }364 url="http://weibo.com/aj/mblog/mbloglist?" +

365 "page="+page+"&count="+count+"&pre_page="+pre_page+"&" +

366 "_k="+ k+"&uid="+memberID+

367 "&_t=0&__rnd="+System.currentTimeMillis();368 }else{369 count=15;370 pre_page=page;371 url="http://weibo.com/aj/mblog/mbloglist?" +

372 "page="+page+"&count="+count+"&max_id="+end_id+"&" +

373 "pre_page="+pre_page+"&end_id="+end_id+"&" +

374 "pagebar="+pagebar+"&_k="+k+"&" +

375 "uid="+memberID+"&_t=0&__rnd="+System.currentTimeMillis();376 }377 String cookieValue = "SINAGLOBAL=8556698272004.724.1417744632425; un=sm2014121903@126.com; myuid=5439352084; YF-Ugrow-G0=4703aa1c27ac0c4bab8fc0fc5968141e; SSOLoginState=1421374583; wvr=6; YF-V5-G0=8c4aa275e8793f05bfb8641c780e617b; _s_tentry=login.sina.com.cn; Apache=2461283528245.9854.1421374588453; ULV=1421374588550:13:5:3:2461283528245.9854.1421374588453:1421210767499; UOR=www.ilehao.com,widget.weibo.com,login.sina.com.cn; SUS=SID-2035860051-1421462085-GZ-7jcgb-1539d643bae5195fb7f792b2ae77befb; SUE=es%3Df15e11ed09b6a0108a28adfa58609b78%26ev%3Dv1%26es2%3Da0f706efac5c89495062648a4de3e337%26rs0%3DZBxlOUv0mhmxyHfOVmZ3tH7tNvAp08BjPeLUJPdu9WzG38Dsm40px%252Bd9w21ycDpZQwBK3q0prFfNs%252F8ZuZSasa1eps%252FOGNxJ3CIHN8JN%252Fik6gVpIPgVeeRdalNWTIbth6hLa34uOp%252BXii%252Bxeib%252BvINsr%252FdOvQx6kjp6fsC44QXc%253D%26rv%3D0; SUP=cv%3D1%26bt%3D1421462085%26et%3D1421548485%26d%3Dc909%26i%3Dbefb%26us%3D1%26vf%3D0%26vt%3D0%26ac%3D2%26st%3D0%26uid%3D2035860051%26name%3Dshy_annan%2540126.com%26nick%3D%25E7%2594%25A8%25E6%2588%25B72035860051%26fmp%3D%26lcp%3D2013-08-18%252021%253A48%253A10; SUB=_2A255vboVDeTxGeRO6FcZ9i7Mzj2IHXVazdpdrDV8PUNbvtBuLVj-kW91jmbQSGo7Rn30RVvGP5KOgBgNgQ..; SUBP=0033WrSXqPxfM725Ws9jqgMF55529P9D9Wh7oKNCGYcNnhlC6eqqQbbl5JpX5KMt; ALF=1452998078; ULOGIN_IMG=14214638933178; YF-Page-G0=0acee381afd48776ab7a56bd67c2e7ac";378 headers.put("Cookie", cookieValue);379 this.headers.put("Referer", "http://weibo.com/u/"+memberID);380 this.headers.put("Host", "www.weibo.com");381 this.headers.put("Content-Type", "application/x-www-form-urlencoded");382 this.headers.put("x-requested-with", "XMLHttpRequest");383 url = "http://weibo.com/u/"+memberID;384 HttpResponse response=HttpUtils.doGet(url, headers);385 if(response==null){386 return "";387 }388 returnHttpUtils.getStringFromResponse(response);389 }390 /*

391 * ~~~~~~~~~~~~~~~~~~~~~获取用户的一些信息~~~end~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~392 */

393

394

395 //**********************************************************************************

396

397 /*

398 * 名人堂与达人信息399 */

400 publicString getVerified(String url){401 this.headers.put("Host", "verified.weibo.com");402 this.headers.put("Referer", "http://plaza.weibo.com/?topnav=1&wvr=4");403 HttpResponse response=HttpUtils.doGet(url, headers);404 String responseText=HttpUtils.getStringFromResponse(response);405 returnresponseText;406 }407

408 publicString getVerifiedMember(String path,Integer g_index){409 String url="http://verified.weibo.com/aj/getgrouplist?g_index="+g_index+

410 "&path="+path+"&_t=0&__rnd="+System.currentTimeMillis();411 this.headers.put("Host", "verified.weibo.com");412 this.headers.put("Referer", path);413 this.headers.put("Content-Type", "application/x-www-form-urlencoded");414 this.headers.put("x-requested-with", "XMLHttpRequest");415 HttpResponse response=HttpUtils.doGet(url, headers);416 String responseText=HttpUtils.getStringFromResponse(response);417

418 returnresponseText;419 }420

421 publicString setArea(Integer provinceID){422 this.headers.put("Referer", "http://club.weibo.com/list");423 this.headers.put("Host", "club.weibo.com");424 this.headers.put("Content-Type", "application/x-www-form-urlencoded");425 this.headers.put("x-requested-with", "XMLHttpRequest");426

427 Map params=new HashMap();428

429 params.put("_t", "0");430 params.put("city", "1000");431 params.put("prov", provinceID+"");432

433 String url="http://club.weibo.com/ajax_setArea.php";434 HttpResponse response=HttpUtils.doPost(url, headers, params);435

436 List cks=HttpUtils.getResponseCookies(response);437 List cookies=ls.getCookies();438 cookies.addAll(cks);439 String cookieValue=HttpUtils.setCookie2String(cookies);440 this.headers.put("Cookie", cookieValue);441

442 returnHttpUtils.getStringFromResponse(response);443 }444

445 publicString getDaRen(Integer page){446 String op="ltime";

447 String url="http://club.weibo.com/list?sex=3&op="+op+"&page="+page+"&";448 Integer pre_page=(page<=1? 2:page-1);449 this.headers.put("Host", "club.weibo.com");450 this.headers.put("Referer", "http://club.weibo.com/list?sex=3&op=ltime&page="+pre_page+"&");451 this.headers.remove("Content-Type");452 this.headers.remove("x-requested-with");453

454 HttpResponse response=HttpUtils.doGet(url, headers);455 if(response!= null){456 returnHttpUtils.getStringFromResponse(response);457 }458 return "";459

460 }

470 //发布一条文字微博

471 publicString releaseTopic(String content){472 this.headers.put("Referer", "http://weibo.com/");473 this.headers.put("Host", "weibo.com");474 this.headers.put("Content-Type", "application/x-www-form-urlencoded");475 this.headers.put("x-requested-with", "XMLHttpRequest");476 Map params=new HashMap();477 params.put("_t", "0");478 params.put("location", "home");479 params.put("module", "stissue");480 params.put("pic_id", "");481 params.put("text", content);482 String url="http://weibo.com/aj/mblog/add?__rnd="+System.currentTimeMillis();483 HttpResponse response=HttpUtils.doPost(url, headers, params);484 returnHttpUtils.getStringFromResponse(response);485 }519 //得到自己关注的成员

520 publicString getSelfFollowIngs(){521 return "";522 }523 //得到自己的粉丝

524 publicString getSelfFollowers(){525 return "";526 }527 //得到自己加入的微群

528 publicString getSelfJoinedGroups(){529 return "";530 }531 //得到自己的标签

532 publicString getSelfTags(){533 return "";534 }535 //得到自己发布的微博

536 publicString getSelfReleaseTopics(){537 return "";538 }539 //得到自己主页的微博

540 publicString getSelfPageTopics(){541 return "";542 }543 //关注一个人

544 publicString addFollowing(String memberid){545 return addorcancleFollowing(memberid,this.ADDFOLLOWING);546 }547 //取消关注一个人

548 publicString cancelFollowing(String memberid){549 return addorcancleFollowing(memberid,this.CANCELFOLLOWING);550 }551 private String addorcancleFollowing(String memberid,intoption){552 String url="";553 switch(option){554 caseADDFOLLOWING:555 url="http://weibo.com/aj/f/followed?__rnd="+System.currentTimeMillis();556 break;557 caseCANCELFOLLOWING:558 url="http://weibo.com/aj/f/unfollow?__rnd="+System.currentTimeMillis();559 break;560 }561

562 Map params=new HashMap();563

564 this.headers.put("Referer", "http://weibo.com/");565 this.headers.put("Host", "weibo.com");566 this.headers.put("Content-Type", "application/x-www-form-urlencoded");567 this.headers.put("Referer", "http://weibo.com/");568 this.headers.put("x-requested-with", "XMLHttpRequest");569

570 params.put("_t", "0");571 params.put("f", "1");572 params.put("location", "profile");573 params.put("refer_flag", "");574 params.put("refer_sort", "profile");575 params.put("uid", memberid);576

577 HttpResponse response=HttpUtils.doPost(url, headers, params);578 returnHttpUtils.getStringFromResponse(response);579 }

584 /**

585 * 得到的标签信息 调用一次10个586 *@return

587 */

588 publicString getTags(){589 String url="http://account.weibo.com/set/aj/tagsuggest?__rnd="+System.currentTimeMillis();590 this.headers.put("Referer", "http://account.weibo.com/set/tag#");591 this.headers.put("Host", "account.weibo.com");592 HttpResponse response=HttpUtils.doGet(url, headers);593 returnHttpUtils.getStringFromResponse(response);594 }595

596 /**

597 * 得到微博热词信息598 *@paramk :热词的门类599 */

600 publicString getHotWords(String k){601 String url="http://data.weibo.com/top/keyword?k="+k;602 try{603 Integer.parseInt(k);604 }catch(Exception ex){605 url="http://data.weibo.com/top/keyword?t="+k;606 }607 this.headers.put("Referer", "http://data.weibo.com/top/keyword");608 this.headers.put("Host", "data.weibo.com");609 HttpResponse response=HttpUtils.doGet(url, headers);610 returnHttpUtils.getStringFromResponse(response);611 }612

613 /**

614 * 得到微博热帖子615 *@paramcat 表示热帖门类616 *@parampage 表示页号617 */

618 public String getHotWeibo(String cat,intpage){619 String url="http://data.weibo.com/hot/ajax/catfeed?page="+page+"&cat="+cat+"&_t=0&__rnd="+System.currentTimeMillis();620 this.headers.put("Referer", "http://data.weibo.com/hot/minibloghot");621 this.headers.put("Host", "data.weibo.com");622 HttpResponse response=HttpUtils.doGet(url, headers);623 returnHttpUtils.getStringFromResponse(response);624 }625

626 /**

627 * 按照分类获取 微博吧名字 第一步628 */

629 public String getWeiBar(String ctgid,intp){630 String sort="post";

631 String url="http://weiba.weibo.com/aj_f/CategoryList?sort="+sort+"&p="+p+"&ctgid="+ctgid+"&_t=0&__rnd="+System.currentTimeMillis();632 this.headers.put("Referer", "http://weiba.weibo.com/ct/"+ctgid);633 this.headers.put("Host", "weiba.weibo.com");634 this.headers.put("Accept", "*/*");635 this.headers.put("Content-Type", "application/x-www-form-urlencoded");636 this.headers.put("X-Requested-With", "XMLHttpRequest");637 HttpResponse response=HttpUtils.doGet(url, headers);638 returnHttpUtils.getStringFromResponse(response);639 }640 /**

641 * 根据微博吧 名称 ,得到该吧内的所有帖子标题 第二步642 */

643 public String getWeiBarByWeibarName(String bid,intp){644 String url="http://weiba.weibo.com/aj_t/postlist?bid="+bid+"&p="+p+"&_t=all&__rnd="+System.currentTimeMillis();645 this.headers.put("Referer", "http://weiba.weibo.com/");646 this.headers.put("Host", "weiba.weibo.com");647 this.headers.put("Accept", "*/*");648 this.headers.put("Content-Type", "application/x-www-form-urlencoded");649 this.headers.put("X-Requested-With", "XMLHttpRequest");650 HttpResponse response=HttpUtils.doGet(url, headers);651 returnHttpUtils.getStringFromResponse(response);652 }653

654 /**

655 * 新浪微公益名单656 * type ="donate"657 * type="discuss"658 */

659 public String getWeiGongYiMember(int page,intprojectID,String type){660 String url="http://gongyi.weibo.com/aj_personal_helpdata?page="+page+"&type="+type+"&project_id="+projectID+"&_t=0&__rnd="+System.currentTimeMillis();661 this.headers.put("Referer", "http://gongyi.weibo.com/"+projectID);662 this.headers.put("Host", "gongyi.weibo.com");663 this.headers.put("Accept", "*/*");664 this.headers.put("Content-Type", "application/x-www-form-urlencoded");665 this.headers.put("X-Requested-With", "XMLHttpRequest");666 HttpResponse response=HttpUtils.doGet(url, headers);667 returnHttpUtils.getStringFromResponse(response);668 }669 }

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值