Match latitude and longitude in description for point which don't have an address

This commit is contained in:
Arne Schlüter 2017-01-29 16:29:19 +01:00
commit 03f715c88e

View file

@ -16,7 +16,8 @@ import sys
import time
import random
coords_in_content = re.compile('\/@(-?\d+\.\d+),(-?\d+\.\d+),')
coords_in_content = re.compile(r'\/@(-?\d+\.\d+),(-?\d+\.\d+),')
coords_in_description = re.compile(r'^(-?\d+\.\d+),(-?\d+\.\d+)$')
user_agent = 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.2526.73 Safari/537.36'
filename = r'GoogleBookmarks.html'
@ -42,9 +43,18 @@ for label in doc.body.iterfind('dl/dt/h3'):
for element, _, url, _ in label.getparent().getnext().iterlinks():
if 'maps.google' in url:
description = element.text or ''
latitude = longitude = None
try:
# check if the link itself contains the coordinate
latitude, longitude = coords_in_description.search(
description).groups()
print("Found point {0},{1} in description".format(
latitude, longitude))
except (AttributeError, IndexError):
safe_query = ['{0}={1}'.format(k, quote_plus(v))
for (k, v) in parse_qsl(urlparse(url).query)]
url = '{0}/?{1}'.format(url.split('/?')[0], '&'.join(safe_query))
url = '{0}/?{1}'.format(url.split('/?')
[0], '&'.join(safe_query))
print('GET {0} {1}'.format(url, description.encode('UTF8')))
browser = Browser()
@ -63,16 +73,13 @@ for label in doc.body.iterfind('dl/dt/h3'):
sock.close()
try:
coords = coords_in_content.search(content).groups()
latitude = coords[0]
longitude = coords[1]
latitude, longitude = coords_in_content.search(
content).groups()
except (AttributeError, IndexError):
print('[Coordinates not found: ' + str(coords) +
'. Try to update "user_agent"]')
print('[Coordinates not found: ({0},{1}).'
'Try to update "user_agent"]'.format(latitude, longitude))
continue
print(latitude, longitude)
try:
kml.newpoint(name=description,
coords=[(float(longitude), float(latitude))])