63 lines
1.7 KiB
Python
63 lines
1.7 KiB
Python
|
import os
|
||
|
import string
|
||
|
import urllib.parse
|
||
|
import urllib.request
|
||
|
from typing import Optional
|
||
|
|
||
|
from .compat import WINDOWS
|
||
|
|
||
|
|
||
|
def get_url_scheme(url: str) -> Optional[str]:
|
||
|
if ":" not in url:
|
||
|
return None
|
||
|
return url.split(":", 1)[0].lower()
|
||
|
|
||
|
|
||
|
def path_to_url(path: str) -> str:
|
||
|
"""
|
||
|
Convert a path to a file: URL. The path will be made absolute and have
|
||
|
quoted path parts.
|
||
|
"""
|
||
|
path = os.path.normpath(os.path.abspath(path))
|
||
|
url = urllib.parse.urljoin("file:", urllib.request.pathname2url(path))
|
||
|
return url
|
||
|
|
||
|
|
||
|
def url_to_path(url: str) -> str:
|
||
|
"""
|
||
|
Convert a file: URL to a path.
|
||
|
"""
|
||
|
assert url.startswith(
|
||
|
"file:"
|
||
|
), f"You can only turn file: urls into filenames (not {url!r})"
|
||
|
|
||
|
_, netloc, path, _, _ = urllib.parse.urlsplit(url)
|
||
|
|
||
|
if not netloc or netloc == "localhost":
|
||
|
# According to RFC 8089, same as empty authority.
|
||
|
netloc = ""
|
||
|
elif WINDOWS:
|
||
|
# If we have a UNC path, prepend UNC share notation.
|
||
|
netloc = "\\\\" + netloc
|
||
|
else:
|
||
|
raise ValueError(
|
||
|
f"non-local file URIs are not supported on this platform: {url!r}"
|
||
|
)
|
||
|
|
||
|
path = urllib.request.url2pathname(netloc + path)
|
||
|
|
||
|
# On Windows, urlsplit parses the path as something like "/C:/Users/foo".
|
||
|
# This creates issues for path-related functions like io.open(), so we try
|
||
|
# to detect and strip the leading slash.
|
||
|
if (
|
||
|
WINDOWS
|
||
|
and not netloc # Not UNC.
|
||
|
and len(path) >= 3
|
||
|
and path[0] == "/" # Leading slash to strip.
|
||
|
and path[1] in string.ascii_letters # Drive letter.
|
||
|
and path[2:4] in (":", ":/") # Colon + end of string, or colon + absolute path.
|
||
|
):
|
||
|
path = path[1:]
|
||
|
|
||
|
return path
|