1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162 |
- import os
- import string
- import urllib.parse
- import urllib.request
- from typing import Optional
- from .compat import WINDOWS
- def get_url_scheme(url: str) -> Optional[str]:
- if ":" not in url:
- return None
- return url.split(":", 1)[0].lower()
- def path_to_url(path: str) -> str:
- """
- Convert a path to a file: URL. The path will be made absolute and have
- quoted path parts.
- """
- path = os.path.normpath(os.path.abspath(path))
- url = urllib.parse.urljoin("file:", urllib.request.pathname2url(path))
- return url
- def url_to_path(url: str) -> str:
- """
- Convert a file: URL to a path.
- """
- assert url.startswith(
- "file:"
- ), f"You can only turn file: urls into filenames (not {url!r})"
- _, netloc, path, _, _ = urllib.parse.urlsplit(url)
- if not netloc or netloc == "localhost":
- # According to RFC 8089, same as empty authority.
- netloc = ""
- elif WINDOWS:
- # If we have a UNC path, prepend UNC share notation.
- netloc = "\\\\" + netloc
- else:
- raise ValueError(
- f"non-local file URIs are not supported on this platform: {url!r}"
- )
- path = urllib.request.url2pathname(netloc + path)
- # On Windows, urlsplit parses the path as something like "/C:/Users/foo".
- # This creates issues for path-related functions like io.open(), so we try
- # to detect and strip the leading slash.
- if (
- WINDOWS
- and not netloc # Not UNC.
- and len(path) >= 3
- and path[0] == "/" # Leading slash to strip.
- and path[1] in string.ascii_letters # Drive letter.
- and path[2:4] in (":", ":/") # Colon + end of string, or colon + absolute path.
- ):
- path = path[1:]
- return path
|