Source code for astropy.utils.xml.unescaper
# Licensed under a 3-clause BSD style license - see LICENSE.rst
"""URL unescaper functions."""
# STDLIB
from xml.sax import saxutils
__all__ = ["unescape_all"]
# This is DIY
_bytes_entities = {
b"&": b"&",
b"<": b"<",
b">": b">",
b"&&": b"&",
b"&&": b"&",
b"%2F": b"/",
}
_bytes_keys = [b"&&", b"&&", b"&", b"<", b">", b"%2F"]
# This is used by saxutils
_str_entities = {"&&": "&", "&&": "&", "%2F": "/"}
_str_keys = ["&&", "&&", "&", "<", ">", "%2F"]
[docs]def unescape_all(url):
"""Recursively unescape a given URL.
.. note:: '&&' becomes a single '&'.
Parameters
----------
url : str or bytes
URL to unescape.
Returns
-------
clean_url : str or bytes
Unescaped URL.
"""
if isinstance(url, bytes):
func2use = _unescape_bytes
keys2use = _bytes_keys
else:
func2use = _unescape_str
keys2use = _str_keys
clean_url = func2use(url)
not_done = [clean_url.count(key) > 0 for key in keys2use]
if True in not_done:
return unescape_all(clean_url)
else:
return clean_url
def _unescape_str(url):
return saxutils.unescape(url, _str_entities)
def _unescape_bytes(url):
clean_url = url
for key in _bytes_keys:
clean_url = clean_url.replace(key, _bytes_entities[key])
return clean_url