usse/scrape/venv/lib/python3.10/site-packages/geopy/geocoders/google.py

443 lines
16 KiB
Python
Raw Normal View History

2023-12-22 14:26:01 +00:00
import base64
import collections.abc
import hashlib
import hmac
from calendar import timegm
from datetime import datetime
from functools import partial
from urllib.parse import urlencode
from geopy.exc import (
ConfigurationError,
GeocoderQueryError,
GeocoderQuotaExceeded,
GeocoderServiceError,
GeocoderUnavailable,
)
from geopy.geocoders.base import DEFAULT_SENTINEL, Geocoder
from geopy.location import Location
from geopy.timezone import ensure_pytz_is_installed, from_timezone_name
from geopy.util import logger
__all__ = ("GoogleV3", )
class GoogleV3(Geocoder):
"""Geocoder using the Google Maps v3 API.
Documentation at:
https://developers.google.com/maps/documentation/geocoding/
Pricing details:
https://developers.google.com/maps/documentation/geocoding/usage-and-billing
"""
api_path = '/maps/api/geocode/json'
timezone_path = '/maps/api/timezone/json'
def __init__(
self,
api_key=None,
*,
domain='maps.googleapis.com',
scheme=None,
client_id=None,
secret_key=None,
timeout=DEFAULT_SENTINEL,
proxies=DEFAULT_SENTINEL,
user_agent=None,
ssl_context=DEFAULT_SENTINEL,
adapter_factory=None,
channel=''
):
"""
:param str api_key: The API key required by Google to perform
geocoding requests, mandatory (unless premier is used,
then both ``client_id`` and ``secret_key`` must be specified
instead).
API keys are managed through
the Google APIs console (https://code.google.com/apis/console).
Make sure to have both ``Geocoding API`` and ``Time Zone API``
services enabled for this API key.
.. versionchanged:: 2.1
Previously a warning has been emitted when neither ``api_key``
nor premier were specified. Now a :class:`geopy.exc.ConfigurationError`
is raised.
:param str domain: Should be the localized Google Maps domain to
connect to. The default is 'maps.googleapis.com', but if you're
geocoding address in the UK (for example), you may want to set it
to 'maps.google.co.uk' to properly bias results.
:param str scheme:
See :attr:`geopy.geocoders.options.default_scheme`.
:param str client_id: If using premier, the account client id.
:param str secret_key: If using premier, the account secret key.
:param int timeout:
See :attr:`geopy.geocoders.options.default_timeout`.
:param dict proxies:
See :attr:`geopy.geocoders.options.default_proxies`.
:param str user_agent:
See :attr:`geopy.geocoders.options.default_user_agent`.
:type ssl_context: :class:`ssl.SSLContext`
:param ssl_context:
See :attr:`geopy.geocoders.options.default_ssl_context`.
:param callable adapter_factory:
See :attr:`geopy.geocoders.options.default_adapter_factory`.
.. versionadded:: 2.0
:param str channel: If using premier, the channel identifier.
"""
super().__init__(
scheme=scheme,
timeout=timeout,
proxies=proxies,
user_agent=user_agent,
ssl_context=ssl_context,
adapter_factory=adapter_factory,
)
if client_id and not secret_key:
raise ConfigurationError('Must provide secret_key with client_id.')
if secret_key and not client_id:
raise ConfigurationError('Must provide client_id with secret_key.')
self.premier = bool(client_id and secret_key)
self.client_id = client_id
self.secret_key = secret_key
if not self.premier and not api_key:
raise ConfigurationError(
'Since July 2018 Google requires each request to have an API key. '
'Pass a valid `api_key` to GoogleV3 geocoder to fix this error. '
'See https://developers.google.com/maps/documentation/geocoding/usage-and-billing' # noqa
)
self.api_key = api_key
self.domain = domain.strip('/')
self.channel = channel
self.api = '%s://%s%s' % (self.scheme, self.domain, self.api_path)
self.tz_api = '%s://%s%s' % (self.scheme, self.domain, self.timezone_path)
def _get_signed_url(self, params):
"""
Returns a Premier account signed url. Docs on signature:
https://developers.google.com/maps/documentation/business/webservices/auth#digital_signatures
"""
params['client'] = self.client_id
if self.channel:
params['channel'] = self.channel
path = "?".join((self.api_path, urlencode(params)))
signature = hmac.new(
base64.urlsafe_b64decode(self.secret_key),
path.encode('utf-8'),
hashlib.sha1
)
signature = base64.urlsafe_b64encode(
signature.digest()
).decode('utf-8')
return '%s://%s%s&signature=%s' % (
self.scheme, self.domain, path, signature
)
def _format_components_param(self, components):
component_items = []
if isinstance(components, collections.abc.Mapping):
component_items = components.items()
elif (
isinstance(components, collections.abc.Sequence)
and not isinstance(components, (str, bytes))
):
component_items = components
else:
raise ValueError(
'`components` parameter must be of type `dict` or `list`')
return "|".join(
":".join(item) for item in component_items
)
def geocode(
self,
query=None,
*,
exactly_one=True,
timeout=DEFAULT_SENTINEL,
bounds=None,
region=None,
components=None,
place_id=None,
language=None,
sensor=False
):
"""
Return a location point by address.
:param str query: The address or query you wish to geocode. Optional,
if ``components`` param is set::
>>> g.geocode(components={"city": "Paris", "country": "FR"})
Location(France, (46.227638, 2.213749, 0.0))
:param bool exactly_one: Return one result or a list of results, if
available.
:param int timeout: Time, in seconds, to wait for the geocoding service
to respond before raising a :class:`geopy.exc.GeocoderTimedOut`
exception. Set this only if you wish to override, on this call
only, the value set during the geocoder's initialization.
:type bounds: list or tuple of 2 items of :class:`geopy.point.Point` or
``(latitude, longitude)`` or ``"%(latitude)s, %(longitude)s"``.
:param bounds: The bounding box of the viewport within which
to bias geocode results more prominently.
Example: ``[Point(22, 180), Point(-22, -180)]``.
:param str region: The region code, specified as a ccTLD
("top-level domain") two-character value.
:type components: dict or list
:param components: Restricts to an area. Can use any combination of:
`route`, `locality`, `administrative_area`, `postal_code`,
`country`.
Pass a list of tuples if you want to specify multiple components of
the same type, e.g.:
>>> [('administrative_area', 'VA'), ('administrative_area', 'Arlington')]
:param str place_id: Retrieve a Location using a Place ID.
Cannot be not used with ``query`` or ``bounds`` parameters.
>>> g.geocode(place_id='ChIJOcfP0Iq2j4ARDrXUa7ZWs34')
:param str language: The language in which to return results.
:param bool sensor: Whether the geocoding request comes from a
device with a location sensor.
:rtype: ``None``, :class:`geopy.location.Location` or a list of them, if
``exactly_one=False``.
"""
params = {
'sensor': str(sensor).lower()
}
if place_id and (bounds or query):
raise ValueError(
'Only one of the `query` or `place id` or `bounds` '
' parameters must be entered.')
if place_id is not None:
params['place_id'] = place_id
if query is not None:
params['address'] = query
if query is None and place_id is None and not components:
raise ValueError('Either `query` or `components` or `place_id` '
'must be set.')
if self.api_key:
params['key'] = self.api_key
if bounds:
params['bounds'] = self._format_bounding_box(
bounds, "%(lat1)s,%(lon1)s|%(lat2)s,%(lon2)s")
if region:
params['region'] = region
if components:
params['components'] = self._format_components_param(components)
if language:
params['language'] = language
if self.premier:
url = self._get_signed_url(params)
else:
url = "?".join((self.api, urlencode(params)))
logger.debug("%s.geocode: %s", self.__class__.__name__, url)
callback = partial(self._parse_json, exactly_one=exactly_one)
return self._call_geocoder(url, callback, timeout=timeout)
def reverse(
self,
query,
*,
exactly_one=True,
timeout=DEFAULT_SENTINEL,
language=None,
sensor=False
):
"""
Return an address by location point.
:param query: The coordinates for which you wish to obtain the
closest human-readable addresses.
:type query: :class:`geopy.point.Point`, list or tuple of ``(latitude,
longitude)``, or string as ``"%(latitude)s, %(longitude)s"``.
:param bool exactly_one: Return one result or a list of results, if
available.
:param int timeout: Time, in seconds, to wait for the geocoding service
to respond before raising a :class:`geopy.exc.GeocoderTimedOut`
exception. Set this only if you wish to override, on this call
only, the value set during the geocoder's initialization.
:param str language: The language in which to return results.
:param bool sensor: Whether the geocoding request comes from a
device with a location sensor.
:rtype: ``None``, :class:`geopy.location.Location` or a list of them, if
``exactly_one=False``.
"""
params = {
'latlng': self._coerce_point_to_string(query),
'sensor': str(sensor).lower()
}
if language:
params['language'] = language
if self.api_key:
params['key'] = self.api_key
if not self.premier:
url = "?".join((self.api, urlencode(params)))
else:
url = self._get_signed_url(params)
logger.debug("%s.reverse: %s", self.__class__.__name__, url)
callback = partial(self._parse_json, exactly_one=exactly_one)
return self._call_geocoder(url, callback, timeout=timeout)
def reverse_timezone(self, query, *, at_time=None, timeout=DEFAULT_SENTINEL):
"""
Find the timezone a point in `query` was in for a specified `at_time`.
`None` will be returned for points without an assigned
Olson timezone id (e.g. for Antarctica).
:param query: The coordinates for which you want a timezone.
:type query: :class:`geopy.point.Point`, list or tuple of (latitude,
longitude), or string as "%(latitude)s, %(longitude)s"
:param at_time: The time at which you want the timezone of this
location. This is optional, and defaults to the time that the
function is called in UTC. Timezone-aware datetimes are correctly
handled and naive datetimes are silently treated as UTC.
:type at_time: :class:`datetime.datetime` or None
:param int timeout: Time, in seconds, to wait for the geocoding service
to respond before raising a :class:`geopy.exc.GeocoderTimedOut`
exception. Set this only if you wish to override, on this call
only, the value set during the geocoder's initialization.
:rtype: ``None`` or :class:`geopy.timezone.Timezone`.
"""
ensure_pytz_is_installed()
location = self._coerce_point_to_string(query)
timestamp = self._normalize_timezone_at_time(at_time)
params = {
"location": location,
"timestamp": timestamp,
}
if self.api_key:
params['key'] = self.api_key
url = "?".join((self.tz_api, urlencode(params)))
logger.debug("%s.reverse_timezone: %s", self.__class__.__name__, url)
return self._call_geocoder(url, self._parse_json_timezone, timeout=timeout)
def _parse_json_timezone(self, response):
self._check_status(response)
timezone_id = response.get("timeZoneId")
if timezone_id is None:
# Google returns `status: ZERO_RESULTS` for uncovered
# points (e.g. for Antarctica), so there's nothing
# meaningful to be returned as the `raw` response,
# hence we return `None`.
return None
return from_timezone_name(timezone_id, raw=response)
def _normalize_timezone_at_time(self, at_time):
if at_time is None:
timestamp = timegm(datetime.utcnow().utctimetuple())
elif isinstance(at_time, datetime):
# Naive datetimes are silently treated as UTC.
# Timezone-aware datetimes are handled correctly.
timestamp = timegm(at_time.utctimetuple())
else:
raise GeocoderQueryError(
"`at_time` must be an instance of `datetime.datetime`"
)
return timestamp
def _parse_json(self, page, exactly_one=True):
places = page.get('results', [])
self._check_status(page)
if not places:
return None
def parse_place(place):
'''Get the location, lat, lng from a single json place.'''
location = place.get('formatted_address')
latitude = place['geometry']['location']['lat']
longitude = place['geometry']['location']['lng']
return Location(location, (latitude, longitude), place)
if exactly_one:
return parse_place(places[0])
else:
return [parse_place(place) for place in places]
def _check_status(self, response):
# https://developers.google.com/maps/documentation/geocoding/requests-geocoding#StatusCodes
status = response.get('status')
if status == 'OK':
return
if status == 'ZERO_RESULTS':
return
error_message = response.get('error_message')
# https://developers.google.com/maps/documentation/geocoding/requests-geocoding#ErrorMessages
# When the geocoder returns a status code other than OK, there *may*
# be an additional error_message field within the Geocoding response
# object.
if status in ('OVER_QUERY_LIMIT', 'OVER_DAILY_LIMIT'):
raise GeocoderQuotaExceeded(
error_message or
'The given key has gone over the requests limit in the 24'
' hour period or has submitted too many requests in too'
' short a period of time'
)
elif status == 'REQUEST_DENIED':
raise GeocoderQueryError(error_message or 'Your request was denied')
elif status == 'INVALID_REQUEST':
raise GeocoderQueryError(
error_message or 'Probably missing address or latlng'
)
elif status == 'UNKNOWN_ERROR':
raise GeocoderUnavailable(error_message or 'Server error')
else:
# Unknown (undocumented) status.
raise GeocoderServiceError(error_message or 'Unknown error')