|
import os |
|
import socket |
|
import struct |
|
from typing import Optional |
|
from urllib.parse import unquote, urlparse |
|
from ._exceptions import WebSocketProxyException |
|
|
|
""" |
|
_url.py |
|
websocket - WebSocket client library for Python |
|
|
|
Copyright 2024 engn33r |
|
|
|
Licensed under the Apache License, Version 2.0 (the "License"); |
|
you may not use this file except in compliance with the License. |
|
You may obtain a copy of the License at |
|
|
|
http://www.apache.org/licenses/LICENSE-2.0 |
|
|
|
Unless required by applicable law or agreed to in writing, software |
|
distributed under the License is distributed on an "AS IS" BASIS, |
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
|
See the License for the specific language governing permissions and |
|
limitations under the License. |
|
""" |
|
|
|
__all__ = ["parse_url", "get_proxy_info"] |
|
|
|
|
|
def parse_url(url: str) -> tuple: |
|
""" |
|
parse url and the result is tuple of |
|
(hostname, port, resource path and the flag of secure mode) |
|
|
|
Parameters |
|
---------- |
|
url: str |
|
url string. |
|
""" |
|
if ":" not in url: |
|
raise ValueError("url is invalid") |
|
|
|
scheme, url = url.split(":", 1) |
|
|
|
parsed = urlparse(url, scheme="http") |
|
if parsed.hostname: |
|
hostname = parsed.hostname |
|
else: |
|
raise ValueError("hostname is invalid") |
|
port = 0 |
|
if parsed.port: |
|
port = parsed.port |
|
|
|
is_secure = False |
|
if scheme == "ws": |
|
if not port: |
|
port = 80 |
|
elif scheme == "wss": |
|
is_secure = True |
|
if not port: |
|
port = 443 |
|
else: |
|
raise ValueError("scheme %s is invalid" % scheme) |
|
|
|
if parsed.path: |
|
resource = parsed.path |
|
else: |
|
resource = "/" |
|
|
|
if parsed.query: |
|
resource += f"?{parsed.query}" |
|
|
|
return hostname, port, resource, is_secure |
|
|
|
|
|
DEFAULT_NO_PROXY_HOST = ["localhost", "127.0.0.1"] |
|
|
|
|
|
def _is_ip_address(addr: str) -> bool: |
|
try: |
|
socket.inet_aton(addr) |
|
except socket.error: |
|
return False |
|
else: |
|
return True |
|
|
|
|
|
def _is_subnet_address(hostname: str) -> bool: |
|
try: |
|
addr, netmask = hostname.split("/") |
|
return _is_ip_address(addr) and 0 <= int(netmask) < 32 |
|
except ValueError: |
|
return False |
|
|
|
|
|
def _is_address_in_network(ip: str, net: str) -> bool: |
|
ipaddr: int = struct.unpack("!I", socket.inet_aton(ip))[0] |
|
netaddr, netmask = net.split("/") |
|
netaddr: int = struct.unpack("!I", socket.inet_aton(netaddr))[0] |
|
|
|
netmask = (0xFFFFFFFF << (32 - int(netmask))) & 0xFFFFFFFF |
|
return ipaddr & netmask == netaddr |
|
|
|
|
|
def _is_no_proxy_host(hostname: str, no_proxy: Optional[list]) -> bool: |
|
if not no_proxy: |
|
if v := os.environ.get("no_proxy", os.environ.get("NO_PROXY", "")).replace( |
|
" ", "" |
|
): |
|
no_proxy = v.split(",") |
|
if not no_proxy: |
|
no_proxy = DEFAULT_NO_PROXY_HOST |
|
|
|
if "*" in no_proxy: |
|
return True |
|
if hostname in no_proxy: |
|
return True |
|
if _is_ip_address(hostname): |
|
return any( |
|
[ |
|
_is_address_in_network(hostname, subnet) |
|
for subnet in no_proxy |
|
if _is_subnet_address(subnet) |
|
] |
|
) |
|
for domain in [domain for domain in no_proxy if domain.startswith(".")]: |
|
if hostname.endswith(domain): |
|
return True |
|
return False |
|
|
|
|
|
def get_proxy_info( |
|
hostname: str, |
|
is_secure: bool, |
|
proxy_host: Optional[str] = None, |
|
proxy_port: int = 0, |
|
proxy_auth: Optional[tuple] = None, |
|
no_proxy: Optional[list] = None, |
|
proxy_type: str = "http", |
|
) -> tuple: |
|
""" |
|
Try to retrieve proxy host and port from environment |
|
if not provided in options. |
|
Result is (proxy_host, proxy_port, proxy_auth). |
|
proxy_auth is tuple of username and password |
|
of proxy authentication information. |
|
|
|
Parameters |
|
---------- |
|
hostname: str |
|
Websocket server name. |
|
is_secure: bool |
|
Is the connection secure? (wss) looks for "https_proxy" in env |
|
instead of "http_proxy" |
|
proxy_host: str |
|
http proxy host name. |
|
proxy_port: str or int |
|
http proxy port. |
|
no_proxy: list |
|
Whitelisted host names that don't use the proxy. |
|
proxy_auth: tuple |
|
HTTP proxy auth information. Tuple of username and password. Default is None. |
|
proxy_type: str |
|
Specify the proxy protocol (http, socks4, socks4a, socks5, socks5h). Default is "http". |
|
Use socks4a or socks5h if you want to send DNS requests through the proxy. |
|
""" |
|
if _is_no_proxy_host(hostname, no_proxy): |
|
return None, 0, None |
|
|
|
if proxy_host: |
|
if not proxy_port: |
|
raise WebSocketProxyException("Cannot use port 0 when proxy_host specified") |
|
port = proxy_port |
|
auth = proxy_auth |
|
return proxy_host, port, auth |
|
|
|
env_key = "https_proxy" if is_secure else "http_proxy" |
|
value = os.environ.get(env_key, os.environ.get(env_key.upper(), "")).replace( |
|
" ", "" |
|
) |
|
if value: |
|
proxy = urlparse(value) |
|
auth = ( |
|
(unquote(proxy.username), unquote(proxy.password)) |
|
if proxy.username |
|
else None |
|
) |
|
return proxy.hostname, proxy.port, auth |
|
|
|
return None, 0, None |
|
|