Python 3.6
我正在尝试使用python来爬行Google Maps区域内公交车站的位置。我读过类似的问题,但仍然没有找到解决方法。
raw_decode中的文件“ d:\ ProgramData \ Anaconda3 \ lib \ json \ decoder.py”,第357行 从None提高JSONDecodeError(“期望值”,s,err.value)
JSONDecodeError:期望值这里是代码
跟踪:
回溯(最近通话最近一次):
文件“”,第1行,在 runfile('D:/Dropbox/Lisa/CRC/BusStop/google_place.py',> wdir ='D:/ Dropbox / Lisa / CRC / BusStop')
文件“ D:/ ProgramData / Anaconda3 / lib / site-> packages / spyder / utils / site / sitecustomize.py”,行710,在运行文件中 execfile(文件名,命名空间)
execfile中第101行的文件“ D:/ ProgramData / Anaconda3 / lib / site-> packages / spyder / utils / site / sitecustomize.py” exec(compile(f.read(),文件名,'exec'),命名空间)
文件“ D:/Dropbox/Lisa/CRC/BusStop/google_place.py”的第123行 main()
文件“ D:/Dropbox/Lisa/CRC/BusStop/google_place.py”在主行中的第117行 对于st,st_lat,st_lng,neighborhood_bus_stations(lat,lng,apikeys)中的公交车:
> nearby_bus_stations中的文件“ D:/Dropbox/Lisa/CRC/BusStop/google_place.py”,第73行 “&rankby = distance&language = zh-TW&type = bus_station”)
get_web_json中第48行的文件“ D:/Dropbox/Lisa/CRC/BusStop/google_place.py” 返回json.loads(dataform.decode(“ utf8”))
文件“ d:\ ProgramData \ Anaconda3 \ lib \ json__init __。py”,第354行,正在加载 返回_default_decoder.decode(s)
文件“ d:\ ProgramData \ Anaconda3 \ lib \ json \ decoder.py”,行339,在解码中 obj,end = self.raw_decode(s,idx = _w(s,0).end())
raw_decode中的文件“ d:\ ProgramData \ Anaconda3 \ lib \ json \ decoder.py”,第357行 从None提高JSONDecodeError(“期望值”,s,err.value)
JSONDecodeError:期望值
这是完整的代码:
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import sys
import json
from urllib.request import urlopen, Request
from lxml import html
import random
def warning(msg):
sys.stderr.write("Warning: %s\n" % msg)
def dump_list(ls):
return '[' + ','.join(ls) + ']'
def get_webpage(url):
""" Given a HTTP/HTTPS url and then returns string
Returns:
string of HTML source code
"""
req = Request(url, headers={'Accept-Charset': 'utf-8', 'Accept-Language': 'zh-tw,en-us;q=0.5'})
with urlopen(req) as rsq:
_, _, charset = rsq.headers['Content-Type'].partition('charset=')
if not charset:
charset = 'utf-8'
htmlbytes = rsq.readall()
charset = charset.strip()
try:
return str(htmlbytes, charset)
except (UnicodeDecodeError):
warning('encoding htmlbytes to {} failed'.format(charset))
with open('UnicodeDecodeError.html', 'wb') as fout:
fout.write(htmlbytes)
raise
def get_web_json(url):
with urlopen(url) as rsq:
# return json.loads(str(rsq.readall(), 'utf8'))
print(str(rsq.read()))
dataform = rsq.read()
# print(dataform)
# return json.loads(str(rsq.read(), 'utf8'))
return json.loads(dataform.decode("utf8"))
print(dataform.decode("utf8"))
def random_key(apikeys):
return apikeys[random.randrange(0, len(apikeys))]
def nearby_bus_stations(lat, lng, apikeys):
""" Return a list of nearby bus stations around the location
Args:
lat: (float) latitude in degrees
lng: (float) longitude in degrees
apikey: Google API Key which enables Place API
Yields:
tuple(station:str, latitude: float, longitude: float, list[bus: string])
Example:
>>> sts = list(nearby_bus_stations(25.021072,121.551788))
>>> print sts[0]
("黎明社教中心", 25.019798, 121.551818, ["懷恩專車S32"])
"""
for apikey in apikeys:
places = get_web_json(
"https://maps.googleapis.com/maps/api/place/nearbysearch/json?" +
"key=%s&location=%f,%f" % (apikey, lat, lng) +
"&rankby=distance&language=zh-TW&type=bus_station")
print("places:",places)#wh
if places['status'] == 'OK':
break
if places['status'] != 'OK':
warning("status=" + places['status'])
return
for result in places['results']:
placeid = result['place_id']
for apikey in apikeys:
detail = get_web_json(
"https://maps.googleapis.com/maps/api/place/details/" +
"json?key=%s&placeid=%s" % (apikey, placeid) +
"&language=zh-TW")
if detail['status'] == 'OK':
break
if detail['status'] != 'OK':
warning("status=" + detail['status'])
break
station = detail['result']['name']
loc = detail['result']['geometry']['location']
buspage = get_webpage(detail['result']['url'])
tree = html.fromstring(buspage)
bus_elm = tree.xpath("/html/body/div[1]/div/div[4]/div[4]/div/div/div[2]/div/div[2]/div[1]/div[2]/div/div/div[2]/div/table/tr/td")
if not bus_elm:
warning('xpath get bus failed')
continue
bus_elm = bus_elm[0]
buses = list(filter(lambda s: len(s.strip()) > 0,
bus_elm.text_content().strip().split()))
yield (station, float(loc['lat']), float(loc['lng']), buses)
def main():
random.seed()
# lat, lng = map(float, sys.argv[1].split(','))
lat, lng = -32.057421,115.770269
# with open('apikeys.json', mode='r') as f:
# apikeys = json.load(f)
apikeys = ["AIzaSyDHRsWPqOZ-LuzAtwCfi2ArKtHH440Pkrk"]
for st, st_lat, st_lng, buses in nearby_bus_stations(lat, lng, apikeys):
print('Station: "{}", ({},{}), Buses={}'.format(
st, st_lat, st_lng, dump_list(buses)))
if __name__ == "__main__":
main()
答案 0 :(得分:0)
函数get_web_json()应该修改为:
def get_web_json(url):
with urlopen(url) as rsq:
dataform = rsq.read().decode().replace('\n','')
return json.loads(dataform)