将下面的 url、params 和 http_header 传给下面基于 cookiejar 和 urllib2 的函数时,会返回 HTTP 404 错误。既然我在 Web 浏览器中可以正常访问这个 URL,为什么会这样?
# Page to fetch. Must be a quoted string literal; a bare URL is a syntax error.
url = "http://stats.ncaa.org/team/442/12911"
# Form fields to send with the request; empty means there is nothing to submit.
params = { }
# Request headers sent with every call.
# NOTE(review): "Content-Type" and "X-Requested-With" look like they were
# copied from a browser AJAX form post -- confirm they are wanted for a plain
# page fetch.
http_header = {
    "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:19.0) Gecko/20100101 Firefox/19.0",
    "Accept": "text/plain, */*; q=0.01",
    "Accept-Language": "en-US,en;q=0.5",
    "DNT": "1",
    "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
    "X-Requested-With": "XMLHttpRequest",
    "Referer": "http://stats.ncaa.org/team/inst_team_list?sport_code=WBB&division=3",
    "Connection": "keep-alive",
    "Pragma": "no-cache",
    "Cache-Control": "no-cache"
} # Variables from the HTTP header (default)
def create_cookie():
    """Build a urllib2 opener with cookie handling installed.

    Returns:
        The opener produced by ``urllib2.build_opener`` with an
        ``HTTPCookieProcessor`` backed by a new ``cookielib.LWPCookieJar``.
        Despite the function's name, the return value is the opener (the
        object you call ``.open()`` on), not a cookie or a cookie jar.
    """
    # A new jar per call, so openers from separate calls do not share cookies.
    jar = cookielib.LWPCookieJar()
    # Wrap the jar in a handler and install it in a new opener.
    return urllib2.build_opener(urllib2.HTTPCookieProcessor(jar))
def grabber(url, params, http_header):
    """Fetch ``url`` through a cookie-aware opener and return the body.

    Args:
        url: Address to request.
        params: Mapping of form fields. When non-empty it is URL-encoded and
            sent as the request body, which makes urllib2 issue a POST. When
            empty (or None) no body is sent and the request is a plain GET.
        http_header: Mapping of HTTP header names to values for the request.

    Returns:
        The response body as returned by the response's ``read()``.

    Raises:
        urllib2.URLError: Propagated from ``open()`` on failure; this includes
            ``urllib2.HTTPError`` for HTTP error statuses such as 404.
    """
    # Opener with cookie handling installed
    opener = create_cookie()
    # urllib2 sends a POST whenever data is not None -- including the empty
    # string that urlencode({}) yields. A browser visiting the page sends a
    # GET, so an accidental empty POST is the likely cause of a 404 here.
    # Pass None when there is nothing to submit.
    post_data = urllib.urlencode(params) if params else None
    # Create the HTTP request
    req = urllib2.Request(url, post_data, http_header)
    # Submit the request
    res = opener.open(req)
    try:
        return res.read()
    finally:
        # Always release the underlying connection, even if read() fails.
        res.close()