usse/funda-scraper/venv/lib/python3.10/site-packages/geopy/geocoders/arcgis.py

329 lines
12 KiB
Python

import json
from functools import partial
from time import time
from urllib.parse import urlencode
from geopy.exc import (
ConfigurationError,
GeocoderAuthenticationFailure,
GeocoderServiceError,
)
from geopy.geocoders.base import DEFAULT_SENTINEL, Geocoder, _synchronized
from geopy.location import Location
from geopy.util import logger
__all__ = ("ArcGIS", )
DEFAULT_WKID = 4326
class ArcGIS(Geocoder):
"""Geocoder using the ERSI ArcGIS API.
Documentation at:
https://developers.arcgis.com/rest/geocode/api-reference/overview-world-geocoding-service.htm
"""
_TOKEN_EXPIRED = 498
auth_path = '/sharing/generateToken'
geocode_path = '/arcgis/rest/services/World/GeocodeServer/findAddressCandidates'
reverse_path = '/arcgis/rest/services/World/GeocodeServer/reverseGeocode'
def __init__(
self,
username=None,
password=None,
*,
referer=None,
token_lifetime=60,
scheme=None,
timeout=DEFAULT_SENTINEL,
proxies=DEFAULT_SENTINEL,
user_agent=None,
ssl_context=DEFAULT_SENTINEL,
adapter_factory=None,
auth_domain='www.arcgis.com',
domain='geocode.arcgis.com'
):
"""
:param str username: ArcGIS username. Required if authenticated
mode is desired.
:param str password: ArcGIS password. Required if authenticated
mode is desired.
:param str referer: Required if authenticated mode is desired.
`Referer` HTTP header to send with each request,
e.g., ``'http://www.example.com'``. This is tied to an issued token,
so fielding queries for multiple referrers should be handled by
having multiple ArcGIS geocoder instances.
:param int token_lifetime: Desired lifetime, in minutes, of an
ArcGIS-issued token.
:param str scheme:
See :attr:`geopy.geocoders.options.default_scheme`.
If authenticated mode is in use, it must be ``'https'``.
:param int timeout:
See :attr:`geopy.geocoders.options.default_timeout`.
:param dict proxies:
See :attr:`geopy.geocoders.options.default_proxies`.
:param str user_agent:
See :attr:`geopy.geocoders.options.default_user_agent`.
:type ssl_context: :class:`ssl.SSLContext`
:param ssl_context:
See :attr:`geopy.geocoders.options.default_ssl_context`.
:param callable adapter_factory:
See :attr:`geopy.geocoders.options.default_adapter_factory`.
.. versionadded:: 2.0
:param str auth_domain: Domain where the target ArcGIS auth service
is hosted. Used only in authenticated mode (i.e. username,
password and referer are set).
:param str domain: Domain where the target ArcGIS service
is hosted.
"""
super().__init__(
scheme=scheme,
timeout=timeout,
proxies=proxies,
user_agent=user_agent,
ssl_context=ssl_context,
adapter_factory=adapter_factory,
)
if username or password or referer:
if not (username and password and referer):
raise ConfigurationError(
"Authenticated mode requires username,"
" password, and referer"
)
if self.scheme != 'https':
raise ConfigurationError(
"Authenticated mode requires scheme of 'https'"
)
self.username = username
self.password = password
self.referer = referer
self.auth_domain = auth_domain.strip('/')
self.auth_api = (
'%s://%s%s' % (self.scheme, self.auth_domain, self.auth_path)
)
self.token_lifetime = token_lifetime * 60 # store in seconds
self.domain = domain.strip('/')
self.api = (
'%s://%s%s' % (self.scheme, self.domain, self.geocode_path)
)
self.reverse_api = (
'%s://%s%s' % (self.scheme, self.domain, self.reverse_path)
)
# Mutable state
self.token = None
self.token_expiry = None
def geocode(self, query, *, exactly_one=True, timeout=DEFAULT_SENTINEL,
out_fields=None):
"""
Return a location point by address.
:param str query: The address or query you wish to geocode.
:param bool exactly_one: Return one result or a list of results, if
available.
:param int timeout: Time, in seconds, to wait for the geocoding service
to respond before raising a :class:`geopy.exc.GeocoderTimedOut`
exception. Set this only if you wish to override, on this call
only, the value set during the geocoder's initialization.
:param out_fields: A list of output fields to be returned in the
attributes field of the raw data. This can be either a python
list/tuple of fields or a comma-separated string. See
https://developers.arcgis.com/rest/geocode/api-reference/geocoding-service-output.htm
for a list of supported output fields. If you want to return all
supported output fields, set ``out_fields="*"``.
:type out_fields: str or iterable
:rtype: ``None``, :class:`geopy.location.Location` or a list of them, if
``exactly_one=False``.
"""
params = {'singleLine': query, 'f': 'json'}
if exactly_one:
params['maxLocations'] = 1
if out_fields is not None:
if isinstance(out_fields, str):
params['outFields'] = out_fields
else:
params['outFields'] = ",".join(out_fields)
url = "?".join((self.api, urlencode(params)))
logger.debug("%s.geocode: %s", self.__class__.__name__, url)
callback = partial(self._parse_geocode, exactly_one=exactly_one)
return self._authenticated_call_geocoder(url, callback, timeout=timeout)
def _parse_geocode(self, response, exactly_one):
if 'error' in response:
raise GeocoderServiceError(str(response['error']))
# Success; convert from the ArcGIS JSON format.
if not len(response['candidates']):
return None
geocoded = []
for resource in response['candidates']:
geometry = resource['location']
geocoded.append(
Location(
resource['address'], (geometry['y'], geometry['x']), resource
)
)
if exactly_one:
return geocoded[0]
return geocoded
def reverse(self, query, *, exactly_one=True, timeout=DEFAULT_SENTINEL,
distance=None):
"""
Return an address by location point.
:param query: The coordinates for which you wish to obtain the
closest human-readable addresses.
:type query: :class:`geopy.point.Point`, list or tuple of ``(latitude,
longitude)``, or string as ``"%(latitude)s, %(longitude)s"``.
:param bool exactly_one: Return one result or a list of results, if
available.
:param int timeout: Time, in seconds, to wait for the geocoding service
to respond before raising a :class:`geopy.exc.GeocoderTimedOut`
exception. Set this only if you wish to override, on this call
only, the value set during the geocoder's initialization.
:param int distance: Distance from the query location, in meters,
within which to search. ArcGIS has a default of 100 meters, if not
specified.
:rtype: ``None``, :class:`geopy.location.Location` or a list of them, if
``exactly_one=False``.
"""
location = self._coerce_point_to_string(query, "%(lon)s,%(lat)s")
wkid = DEFAULT_WKID
params = {'location': location, 'f': 'json', 'outSR': wkid}
if distance is not None:
params['distance'] = distance
url = "?".join((self.reverse_api, urlencode(params)))
logger.debug("%s.reverse: %s", self.__class__.__name__, url)
callback = partial(self._parse_reverse, exactly_one=exactly_one)
return self._authenticated_call_geocoder(url, callback, timeout=timeout)
def _parse_reverse(self, response, exactly_one):
if not len(response):
return None
if 'error' in response:
# https://developers.arcgis.com/rest/geocode/api-reference/geocoding-service-output.htm
if response['error']['code'] == 400:
# 'details': ['Unable to find address for the specified location.']}
try:
if 'Unable to find' in response['error']['details'][0]:
return None
except (KeyError, IndexError):
pass
raise GeocoderServiceError(str(response['error']))
if response['address'].get('Address'):
address = (
"%(Address)s, %(City)s, %(Region)s %(Postal)s,"
" %(CountryCode)s" % response['address']
)
else:
address = response['address']['LongLabel']
location = Location(
address,
(response['location']['y'], response['location']['x']),
response['address']
)
if exactly_one:
return location
else:
return [location]
def _authenticated_call_geocoder(
self, url, parse_callback, *, timeout=DEFAULT_SENTINEL
):
if not self.username:
return self._call_geocoder(url, parse_callback, timeout=timeout)
def query_callback():
call_url = "&".join((url, urlencode({"token": self.token})))
headers = {"Referer": self.referer}
return self._call_geocoder(
call_url,
partial(maybe_reauthenticate_callback, from_token=self.token),
timeout=timeout,
headers=headers,
)
def maybe_reauthenticate_callback(response, *, from_token):
if "error" in response:
if response["error"]["code"] == self._TOKEN_EXPIRED:
return self._refresh_authentication_token(
query_retry_callback, timeout=timeout, from_token=from_token
)
return parse_callback(response)
def query_retry_callback():
call_url = "&".join((url, urlencode({"token": self.token})))
headers = {"Referer": self.referer}
return self._call_geocoder(
call_url, parse_callback, timeout=timeout, headers=headers
)
if self.token is None or int(time()) > self.token_expiry:
return self._refresh_authentication_token(
query_callback, timeout=timeout, from_token=self.token
)
else:
return query_callback()
@_synchronized
def _refresh_authentication_token(self, callback_success, *, timeout, from_token):
if from_token != self.token:
# Token has already been updated by a concurrent call.
return callback_success()
token_request_arguments = {
'username': self.username,
'password': self.password,
'referer': self.referer,
'expiration': self.token_lifetime,
'f': 'json'
}
url = "?".join((self.auth_api, urlencode(token_request_arguments)))
logger.debug(
"%s._refresh_authentication_token: %s",
self.__class__.__name__, url
)
def cb(response):
if "token" not in response:
raise GeocoderAuthenticationFailure(
"Missing token in auth request."
"Request URL: %s; response JSON: %s" % (url, json.dumps(response))
)
self.token = response["token"]
self.token_expiry = int(time()) + self.token_lifetime
return callback_success()
return self._call_geocoder(url, cb, timeout=timeout)