#!/bin/python
# -*- coding: utf-8 -*-
# Fetch torrent addresses from The Pirate Bay.
import pycurl
import StringIO
from bs4 import BeautifulSoup
import re


def headerCookie(buf):
    """Header callback for pycurl: echo one raw response header line.

    Registered through pycurl.HEADERFUNCTION in getEnterRandCode().

    Args:
        buf: the header line handed over by pycurl.
    """
    print(buf)


def getEnterRandCode():
    """Download the Pirate Bay top-list page and dump the result to disk.

    Requests https://thepiratebay.vg/top/201 with pycurl, prints every
    response header (via headerCookie) and the HTTP status code, writes the
    result to /home/david/Downloads/a.html and prints it.

    The function name is historical: the original comment described it as
    fetching a login captcha image, but the code requests the top-list URL.

    Raises:
        pycurl.error: if the transfer fails.
        IOError: if the output file cannot be written.
    """
    body_buffer = StringIO.StringIO()
    curl = pycurl.Curl()
    try:
        curl.setopt(pycurl.URL, "https://thepiratebay.vg/top/201")
        curl.setopt(pycurl.WRITEFUNCTION, body_buffer.write)
        # NOTE(review): certificate and host name verification are switched
        # off, so the connection is open to man-in-the-middle tampering.
        # Kept as in the original; re-enable if the site's certificate
        # validates.
        curl.setopt(pycurl.SSL_VERIFYPEER, 0)
        curl.setopt(pycurl.SSL_VERIFYHOST, 0)
        # TIMEOUT caps the whole transfer (in seconds), not only the connect
        # phase; pycurl.CONNECTTIMEOUT is the connect-only limit.
        curl.setopt(pycurl.TIMEOUT, 300)
        # Present a browser-like User-Agent.
        curl.setopt(
            pycurl.USERAGENT,
            "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322)",
        )
        curl.setopt(pycurl.HEADERFUNCTION, headerCookie)
        curl.setopt(pycurl.COOKIEJAR, "cookie_file_name")
        curl.perform()
        status = curl.getinfo(pycurl.RESPONSE_CODE)
    finally:
        # Always release the handle, even when the transfer raises.
        curl.close()

    print(status)
    backinfo = ''
    if status == 200:
        backinfo = body_buffer.getvalue()

    # The original comment here said a soup object is created next, followed
    # by a commented-out sample document beginning
    #   '<!DOCTYPE html><html lang="en"><head></head><body><tr><td class="vertTh">'
    # after which only the fragment "(Movies)" survives.
    #
    # NOTE(review): the statements that parsed backinfo and produced
    # paper_name are missing from this copy of the file. As a stopgap the raw
    # response body is used so the script stays runnable -- TODO restore the
    # real extraction step and confirm what paper_name is meant to hold.
    paper_name = backinfo

    # The context manager closes the file even if the write fails.
    with open('/home/david/Downloads/a.html', 'w') as file_object:
        file_object.write(paper_name)
    print(paper_name)


getEnterRandCode()