Urllib & Requests
Urllib
Python2
import urllib2
from bs4 import BeautifulSoup
def getHtml(url):
    """Fetch the page source of ``url`` and return it parsed by BeautifulSoup.

    The request is sent with a browser-like ``User-Agent`` and an
    ``Accept: text/html`` header.

    Args:
        url: Address of the page to download.

    Returns:
        A ``BeautifulSoup`` object built with the ``lxml`` parser (the lxml
        package must be installed), or the string ``'error'`` when the
        request fails with ``urllib2.URLError`` / ``urllib2.HTTPError``.
    """
    # Function-local import so this snippet stays self-contained.
    from contextlib import closing

    header = {
        "Accept": "text/html",
        "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_2) AppleWebKit/537.22 (KHTML, like Gecko) Chrome/25.0.1364.160 Safari/537.22",
        # 'Cookie': 'over18=1',  # extra values can be sent via the header,
        #                        # e.g. the Gossiping board's "I am over 18" flag
    }
    request = urllib2.Request(url, headers=header)
    try:
        # Python 2 response objects are not context managers; closing()
        # guarantees the underlying socket is released after reading.
        with closing(urllib2.urlopen(request)) as response:
            html = response.read()
    except urllib2.URLError:
        # HTTPError is a subclass of URLError, so this one handler covers both.
        return 'error'
    return BeautifulSoup(html, 'lxml')

Requests
SSL: CERTIFICATE_VERIFY_FAILED
Last updated