diff --git a/httpcore/__init__.py b/httpcore/__init__.py index 014213ba..30720ef5 100644 --- a/httpcore/__init__.py +++ b/httpcore/__init__.py @@ -3,6 +3,7 @@ AsyncConnectionInterface, AsyncConnectionPool, AsyncHTTP2Connection, + AsyncHTTP3Connection, AsyncHTTP11Connection, AsyncHTTPConnection, AsyncHTTPProxy, @@ -40,6 +41,7 @@ ConnectionInterface, ConnectionPool, HTTP2Connection, + HTTP3Connection, HTTP11Connection, HTTPConnection, HTTPProxy, @@ -85,6 +87,7 @@ def __init__(self, *args, **kwargs): # type: ignore "AsyncHTTPProxy", "AsyncHTTP11Connection", "AsyncHTTP2Connection", + "AsyncHTTP3Connection", "AsyncConnectionInterface", "AsyncSOCKSProxy", # sync @@ -93,6 +96,7 @@ def __init__(self, *args, **kwargs): # type: ignore "HTTPProxy", "HTTP11Connection", "HTTP2Connection", + "HTTP3Connection", "ConnectionInterface", "SOCKSProxy", # network backends, implementations diff --git a/httpcore/_async/__init__.py b/httpcore/_async/__init__.py index 88dc7f01..39cd1abe 100644 --- a/httpcore/_async/__init__.py +++ b/httpcore/_async/__init__.py @@ -16,6 +16,18 @@ def __init__(self, *args, **kwargs) -> None: # type: ignore ) +try: + from .http3 import AsyncHTTP3Connection +except ImportError: # pragma: nocover + + class AsyncHTTP3Connection: # type: ignore + def __init__(self, *args, **kwargs) -> None: # type: ignore + raise RuntimeError( + "Attempted to use http3 support, but the `aioquic` package is not " + "installed. Use 'pip install httpcore[http3]'." + ) + + try: from .socks_proxy import AsyncSOCKSProxy except ImportError: # pragma: nocover @@ -34,6 +46,7 @@ def __init__(self, *args, **kwargs) -> None: # type: ignore "AsyncHTTPProxy", "AsyncHTTP11Connection", "AsyncHTTP2Connection", + "AsyncHTTP3Connection", "AsyncConnectionInterface", "AsyncSOCKSProxy", ] diff --git a/httpcore/_async/connection.py b/httpcore/_async/connection.py index 2f439cf0..a2808d6b 100644 --- a/httpcore/_async/connection.py +++ b/httpcore/_async/connection.py @@ -41,6 +41,7 @@ def __init__( keepalive_expiry: Optional[float] = None, http1: bool = True, http2: bool = False, + http3: bool = False, retries: int = 0, local_address: Optional[str] = None, uds: Optional[str] = None, @@ -52,6 +53,7 @@ def __init__( self._keepalive_expiry = keepalive_expiry self._http1 = http1 self._http2 = http2 + self._http3 = http3 self._retries = retries self._local_address = local_address self._uds = uds @@ -80,7 +82,18 @@ async def handle_async_request(self, request: Request) -> Response: ssl_object is not None and ssl_object.selected_alpn_protocol() == "h2" ) - if http2_negotiated or (self._http2 and not self._http1): + if self._http3 and not ( + self._http1 or self._http2 + ): # pragma: no cover + from .http3 import AsyncHTTP3Connection + + stream = await self._connect_http3(request) + self._connection = AsyncHTTP3Connection( + origin=self._origin, + stream=stream, + keepalive_expiry=self._keepalive_expiry, + ) + elif http2_negotiated or (self._http2 and not self._http1): from .http2 import AsyncHTTP2Connection self._connection = AsyncHTTP2Connection( @@ -162,6 +175,30 @@ async def _connect(self, request: Request) -> AsyncNetworkStream: async with Trace("retry", logger, request, kwargs) as trace: await self._network_backend.sleep(delay) + async def _connect_http3( + self, request: Request + ) -> AsyncNetworkStream: # pragma: nocover + retries_left = self._retries + delays = exponential_backoff(factor=RETRIES_BACKOFF_FACTOR) + + while True: + try: + kwargs = { + "host": self._origin.host.decode("ascii"), + "port": self._origin.port, + } + async with Trace("connect_udp", logger, request, kwargs) as trace: + stream = await self._network_backend.connect_udp(**kwargs) # type: ignore + trace.return_value = stream + return stream + except (ConnectError, ConnectTimeout): + if retries_left <= 0: + raise + retries_left -= 1 + delay = next(delays) + async with Trace("retry", logger, request, kwargs) as trace: + await self._network_backend.sleep(delay) + def can_handle_request(self, origin: Origin) -> bool: return origin == self._origin diff --git a/httpcore/_async/connection_pool.py b/httpcore/_async/connection_pool.py index 214dfc4b..e09ea11f 100644 --- a/httpcore/_async/connection_pool.py +++ b/httpcore/_async/connection_pool.py @@ -53,6 +53,7 @@ def __init__( keepalive_expiry: Optional[float] = None, http1: bool = True, http2: bool = False, + http3: bool = False, retries: int = 0, local_address: Optional[str] = None, uds: Optional[str] = None, @@ -77,6 +78,8 @@ def __init__( by the connection pool. Defaults to True. http2: A boolean indicating if HTTP/2 requests should be supported by the connection pool. Defaults to False. + http3: A boolean indicating if HTTP/3 requests should be supported by + the connection pool. Defaults to False. retries: The maximum number of retries when trying to establish a connection. local_address: Local address to connect from. Can also be used to connect @@ -105,6 +108,7 @@ def __init__( self._keepalive_expiry = keepalive_expiry self._http1 = http1 self._http2 = http2 + self._http3 = http3 self._retries = retries self._local_address = local_address self._uds = uds @@ -131,6 +135,7 @@ def create_connection(self, origin: Origin) -> AsyncConnectionInterface: keepalive_expiry=self._keepalive_expiry, http1=self._http1, http2=self._http2, + http3=self._http3, retries=self._retries, local_address=self._local_address, uds=self._uds, diff --git a/httpcore/_async/http3.py b/httpcore/_async/http3.py new file mode 100644 index 00000000..71b69043 --- /dev/null +++ b/httpcore/_async/http3.py @@ -0,0 +1,497 @@ +import enum +import logging +import time +import types +import typing +from time import monotonic + +import certifi +from aioquic.h3 import events as h3_events, exceptions as h3_exceptions +from aioquic.h3.connection import H3Connection +from aioquic.quic import events as quic_events +from aioquic.quic.configuration import QuicConfiguration +from aioquic.quic.connection import QuicConnection, QuicConnectionState + +from .._backends.base import AsyncNetworkStream +from .._exceptions import ( + ConnectionNotAvailable, + LocalProtocolError, + RemoteProtocolError, +) +from .._models import Origin, Request, Response +from .._synchronization import AsyncLock, AsyncShieldCancellation +from .._trace import Trace +from .interfaces import AsyncConnectionInterface + +logger = logging.getLogger("httpcore.http3") + + +def has_body_headers(request: Request) -> bool: + return any( + k.lower() == b"content-length" or k.lower() == b"transfer-encoding" + for k, v in request.headers + ) + + +class HTTPConnectionState(enum.IntEnum): + ACTIVE = 1 + IDLE = 2 + CLOSED = 3 + + +class AsyncHTTP3Connection(AsyncConnectionInterface): + READ_NUM_BYTES = 64 * 1024 + + def __init__( + self, + origin: Origin, + stream: AsyncNetworkStream, + keepalive_expiry: typing.Optional[float] = None, + ): + quic_configuration = QuicConfiguration( + alpn_protocols=["h3", "h3-32", "h3-31", "h3-30", "h3-29"], + is_client=True, + ) + quic_configuration.server_name = origin.host.decode("ascii") + quic_configuration.cafile = certifi.where() + + self._origin = origin + self._network_stream = stream + self._keepalive_expiry: typing.Optional[float] = keepalive_expiry + self._quic_conn = QuicConnection(configuration=quic_configuration) + self._h3_state = H3Connection(quic=self._quic_conn) + self._state = HTTPConnectionState.IDLE + self._expire_at: typing.Optional[float] = None + self._request_count = 0 + self._state_lock = AsyncLock() + self._read_lock = AsyncLock() + self._write_lock = AsyncLock() + self._handshake_lock = AsyncLock() + self._handshake_done = False + self._sent_connection_init = False + self._used_all_stream_ids = False + self._connection_error = False + + # Mapping from stream ID to response stream events. + self._events: typing.Dict[ + int, + typing.Union[ + h3_events.ResponseReceived, + h3_events.DataReceived, + quic_events.StreamReset, + ], + ] = {} + + # Connection terminated events are stored as state since + # we need to handle them for all streams. + self._connection_terminated: typing.Optional[ + quic_events.ConnectionTerminated + ] = None + + self._read_exception: typing.Optional[Exception] = None + self._write_exception: typing.Optional[Exception] = None + + async def handle_async_request(self, request: Request) -> Response: + if not self.can_handle_request(request.url.origin): + # This cannot occur in normal operation, since the connection pool + # will only send requests on connections that handle them. + # It's in place simply for resilience as a guard against incorrect + # usage, for anyone working directly with httpcore connections. + raise RuntimeError( + f"Attempted to send request to {request.url.origin} on connection " + f"to {self._origin}" + ) + + async with self._state_lock: + if self._state in (HTTPConnectionState.ACTIVE, HTTPConnectionState.IDLE): + self._request_count += 1 + self._expire_at = None + self._state = HTTPConnectionState.ACTIVE + else: + raise ConnectionNotAvailable() + + async with self._handshake_lock: + if not self._handshake_done: + await self._do_handshake(request) + + try: + stream_id = self._quic_conn.get_next_available_stream_id() + self._events[stream_id] = [] + except BaseException: # pragma: nocover + assert False, "Unexpected exception" + + try: + kwargs = {"request": request, "stream_id": stream_id} + async with Trace("send_request_headers", logger, request, kwargs): + await self._send_request_headers(request=request, stream_id=stream_id) + async with Trace("send_request_body", logger, request, kwargs): + await self._send_request_body(request=request, stream_id=stream_id) + async with Trace( + "receive_response_headers", logger, request, kwargs + ) as trace: + status, headers, stream_ended = await self._receive_response( + request=request, stream_id=stream_id + ) + trace.return_value = (status, headers) + + return Response( + status=status, + headers=headers, + content=HTTP3ConnectionByteStream( + self, request, stream_id=stream_id, is_empty=stream_ended + ), + extensions={ + "http_version": b"HTTP/3", + "network_stream": self._network_stream, + "stream_id": stream_id, + }, + ) + except BaseException as exc: # noqa: PIE786 + with AsyncShieldCancellation(): + kwargs = {"stream_id": stream_id} + async with Trace("response_closed", logger, request, kwargs): + await self._response_closed(stream_id=stream_id) + + if isinstance(exc, h3_exceptions.H3Error): + if self._connection_terminated: # pragma: nocover + raise RemoteProtocolError(self._connection_terminated) + raise LocalProtocolError(exc) # pragma: nocover + + raise exc + + # Sending the request... + + async def _do_handshake(self, request: Request) -> None: + assert hasattr(self._network_stream, "_addr") + self._quic_conn.connect(addr=self._network_stream._addr, now=monotonic()) + while not self._handshake_done: + await self._write_outgoing_data(request) + await self._read_incoming_data(request) + + async def _send_request_headers(self, request: Request, stream_id: int) -> None: + """ + Send the request headers to a given stream ID. + """ + end_stream = not has_body_headers(request) + + # In HTTP/3 the ':authority' pseudo-header is used instead of 'Host'. + # In order to gracefully handle HTTP/1.1 and HTTP/3 we always require + # HTTP/1.1 style headers, and map them appropriately if we end up on + # an HTTP/3 connection. + authority = [v for k, v in request.headers if k.lower() == b"host"][0] + + headers = [ + (b":method", request.method), + (b":authority", authority), + (b":scheme", request.url.scheme), + (b":path", request.url.target), + ] + [ + (k.lower(), v) + for k, v in request.headers + if k.lower() + not in ( + b"host", + b"transfer-encoding", + ) + ] + + self._h3_state.send_headers(stream_id, headers, end_stream=end_stream) + await self._write_outgoing_data(request) + + async def _send_request_body(self, request: Request, stream_id: int) -> None: + """ + Iterate over the request body sending it to a given stream ID. + """ + if not has_body_headers(request): + return + + assert isinstance(request.stream, typing.AsyncIterable) + async for data in request.stream: + await self._send_stream_data(request, stream_id, data) + await self._send_end_stream(request, stream_id) + + async def _send_stream_data( + self, request: Request, stream_id: int, data: bytes + ) -> None: + """ + Send a single chunk of data in one or more data frames. + """ + self._h3_state.send_data(stream_id=stream_id, data=data, end_stream=False) + await self._write_outgoing_data(request) + + async def _send_end_stream(self, request: Request, stream_id: int) -> None: + """ + Send an empty data frame on on a given stream ID with the END_STREAM flag set. + """ + self._h3_state.send_data(stream_id=stream_id, data=b"", end_stream=True) + await self._write_outgoing_data(request) + + # Receiving the response... + + async def _receive_response( + self, request: Request, stream_id: int + ) -> typing.Tuple[int, typing.List[typing.Tuple[bytes, bytes]]]: + """ + Return the response status code and headers for a given stream ID. + """ + while True: + event = await self._receive_stream_event(request, stream_id) + if isinstance(event, h3_events.HeadersReceived): + break + + status_code = 200 + headers = [] + for k, v in event.headers: + if k == b":status": + status_code = int(v.decode("ascii", errors="ignore")) + elif not k.startswith(b":"): + headers.append((k, v)) + + return (status_code, headers, event.stream_ended) + + async def _receive_response_body( + self, request: Request, stream_id: int + ) -> typing.AsyncIterator[bytes]: + """ + Iterator that returns the bytes of the response body for a given stream ID. + """ + while True: + event = await self._receive_stream_event(request, stream_id) + if isinstance(event, h3_events.DataReceived): + if event.stream_ended: + break + + await self._write_outgoing_data(request) + yield event.data + + async def _receive_stream_event( + self, request: Request, stream_id: int + ) -> typing.Union[h3_events.HeadersReceived, h3_events.DatagramReceived]: + """ + Return the next available event for a given stream ID. + + Will read more data from the network if required. + """ + while not self._events.get(stream_id): + await self._receive_events(request, stream_id) + event = self._events[stream_id].pop(0) + if isinstance(event, quic_events.StreamReset): + raise RemoteProtocolError(event) + return event + + async def _receive_events( + self, request: Request, stream_id: typing.Optional[int] = None + ) -> None: + """ + Read some data from the network until we see one or more events + for a given stream ID. + """ + + async with self._read_lock: + if self._connection_terminated is not None: + raise RemoteProtocolError(self._connection_terminated) + + # This conditional is a bit icky. We don't want to block reading if we've + # actually got an event to return for a given stream. We need to do that + # check *within* the atomic read lock. + if stream_id is None or not self._events.get(stream_id): + events = await self._read_incoming_data(request) + for event in events: + if isinstance( + event, + ( + h3_events.HeadersReceived, + h3_events.DataReceived, + ), + ): + if event.stream_id in self._events: + self._events[event.stream_id].append(event) + + elif isinstance(event, quic_events.ConnectionTerminated): + self._connection_terminated = event + + await self._write_outgoing_data(request) + + async def _response_closed(self, stream_id: int) -> None: + del self._events[stream_id] + async with self._state_lock: + if self._connection_terminated and not self._events: + await self.aclose() + + elif self._state == HTTPConnectionState.ACTIVE and not self._events: + self._state = HTTPConnectionState.IDLE + if self._keepalive_expiry is not None: + now = time.monotonic() + self._expire_at = now + self._keepalive_expiry + if self._used_all_stream_ids: # pragma: nocover + await self.aclose() + + async def aclose(self) -> None: + # Note that this method unilaterally closes the connection, and does + # not have any kind of locking in place around it. + self._quic_conn.close() + self._state = HTTPConnectionState.CLOSED + await self._network_stream.aclose() + + # Wrappers around network read/write operations... + + async def _read_incoming_data( + self, request: Request + ) -> typing.List[h3_events.H3Event]: + timeouts = request.extensions.get("timeout", {}) + timeout = timeouts.get("read", None) + + if self._read_exception is not None: + raise self._read_exception # pragma: nocover + + try: + data = await self._network_stream.read(self.READ_NUM_BYTES, timeout) + if data == b"": + raise RemoteProtocolError("Server disconnected") + except Exception as exc: + # If we get a network error we should: + # + # 1. Save the exception and just raise it immediately on any future reads. + # (For example, this means that a single read timeout or disconnect will + # immediately close all pending streams. Without requiring multiple + # sequential timeouts.) + # 2. Mark the connection as errored, so that we don't accept any other + # incoming requests. + self._read_exception = exc + self._connection_error = True + raise exc + + self._quic_conn.receive_datagram( + data=data, addr=self._network_stream._addr, now=time.monotonic() + ) + + events: typing.List[h3_events.H3Event] = [] + quic_event = self._quic_conn.next_event() + + while quic_event: + if isinstance(quic_event, quic_events.HandshakeCompleted): + self._handshake_done = True + + # elif isinstance(quic_event, quic_events.StreamDataReceived): + + events.extend(self._h3_state.handle_event(quic_event)) + quic_event = self._quic_conn.next_event() + + return events + + async def _write_outgoing_data(self, request: Request) -> None: + timeouts = request.extensions.get("timeout", {}) + timeout = timeouts.get("write", None) + + async with self._write_lock: + for data_to_send, _ in self._quic_conn.datagrams_to_send(now=monotonic()): + if self._write_exception is not None: + raise self._write_exception # pragma: nocover + + try: + await self._network_stream.write(data_to_send, timeout) + except Exception as exc: # pragma: nocover + # If we get a network error we should: + # + # 1. Save the exception and just raise it immediately on any future write. + # (For example, this means that a single write timeout or disconnect will + # immediately close all pending streams. Without requiring multiple + # sequential timeouts.) + # 2. Mark the connection as errored, so that we don't accept any other + # incoming requests. + self._write_exception = exc + self._connection_error = True + raise exc + + # Interface for connection pooling... + + def can_handle_request(self, origin: Origin) -> bool: + return origin == self._origin + + def is_available(self) -> bool: + return ( + self._state != HTTPConnectionState.CLOSED + and not self._connection_error + and not self._used_all_stream_ids + and not (self._quic_conn._state == QuicConnectionState.CLOSING) + ) + + def has_expired(self) -> bool: + now = time.monotonic() + return self._expire_at is not None and now > self._expire_at + + def is_idle(self) -> bool: + return self._state == HTTPConnectionState.IDLE + + def is_closed(self) -> bool: + return self._state == HTTPConnectionState.CLOSED + + def info(self) -> str: + origin = str(self._origin) + return ( + f"{origin!r}, HTTP/3, {self._state.name}, " + f"Request Count: {self._request_count}" + ) + + def __repr__(self) -> str: + class_name = self.__class__.__name__ + origin = str(self._origin) + return ( + f"<{class_name} [{origin!r}, {self._state.name}, " + f"Request Count: {self._request_count}]>" + ) + + # These context managers are not used in the standard flow, but are + # useful for testing or working with connection instances directly. + + async def __aenter__(self) -> "AsyncHTTP3Connection": + return self + + async def __aexit__( + self, + exc_type: typing.Optional[typing.Type[BaseException]] = None, + exc_value: typing.Optional[BaseException] = None, + traceback: typing.Optional[types.TracebackType] = None, + ) -> None: + await self.aclose() + + +class HTTP3ConnectionByteStream: + def __init__( + self, + connection: AsyncHTTP3Connection, + request: Request, + stream_id: int, + is_empty: bool, + ) -> None: + self._connection = connection + self._request = request + self._stream_id = stream_id + self._closed = False + self._is_empty = is_empty + + async def __aiter__(self) -> typing.AsyncIterator[bytes]: + kwargs = {"request": self._request, "stream_id": self._stream_id} + try: + if not self._is_empty: + async with Trace( + "receive_response_body", logger, self._request, kwargs + ): + async for chunk in self._connection._receive_response_body( + request=self._request, stream_id=self._stream_id + ): + yield chunk + except BaseException as exc: + # If we get an exception while streaming the response, + # we want to close the response (and possibly the connection) + # before raising that exception. + with AsyncShieldCancellation(): + await self.aclose() + raise exc + + async def aclose(self) -> None: + if not self._closed: + self._closed = True + kwargs = {"stream_id": self._stream_id} + async with Trace("response_closed", logger, self._request, kwargs): + await self._connection._response_closed(stream_id=self._stream_id) diff --git a/httpcore/_backends/base.py b/httpcore/_backends/base.py index 6cadedb5..2f80fbf9 100644 --- a/httpcore/_backends/base.py +++ b/httpcore/_backends/base.py @@ -37,8 +37,13 @@ def connect_tcp( host: str, port: int, timeout: typing.Optional[float] = None, - local_address: typing.Optional[str] = None, - socket_options: typing.Optional[typing.Iterable[SOCKET_OPTION]] = None, + ) -> NetworkStream: + raise NotImplementedError() # pragma: nocover + + def connect_udp( + self, + host: str, + port: int, ) -> NetworkStream: raise NotImplementedError() # pragma: nocover @@ -91,6 +96,13 @@ async def connect_tcp( ) -> AsyncNetworkStream: raise NotImplementedError() # pragma: nocover + async def connect_udp( + self, + host: str, + port: int, + ) -> AsyncNetworkStream: + raise NotImplementedError() # pragma: nocover + async def connect_unix_socket( self, path: str, diff --git a/httpcore/_backends/sync.py b/httpcore/_backends/sync.py index 7b7b417d..7052bfe4 100644 --- a/httpcore/_backends/sync.py +++ b/httpcore/_backends/sync.py @@ -18,6 +18,56 @@ from .base import SOCKET_OPTION, NetworkBackend, NetworkStream +class SyncUDPStream(NetworkStream): + def __init__( + self, sock: socket.socket, addr: typing.Tuple[str, int, int, int] + ) -> None: + self._sock = sock + self._addr = addr + + def read(self, max_bytes: int, timeout: typing.Optional[float] = None) -> bytes: + exc_map: ExceptionMapping = {socket.timeout: ReadTimeout, OSError: ReadError} + with map_exceptions(exc_map): + self._sock.settimeout(timeout) + data = self._sock.recvfrom(max_bytes)[0] + return data + + def write(self, buffer: bytes, timeout: typing.Optional[float] = None) -> None: + if not buffer: + return + + exc_map: ExceptionMapping = {socket.timeout: WriteTimeout, OSError: WriteError} + with map_exceptions(exc_map): + while buffer: + self._sock.settimeout(timeout) + n = self._sock.sendto(buffer, self._addr) + buffer = buffer[n:] + + def close(self) -> None: + self._sock.close() + + def start_tls( + self, + ssl_context: ssl.SSLContext, + server_hostname: typing.Optional[str] = None, + timeout: typing.Optional[float] = None, + ) -> NetworkStream: + raise NotImplementedError() + + def get_extra_info(self, info: str) -> typing.Any: + if info == "ssl_object" and isinstance(self._sock, ssl.SSLSocket): + return self._sock._sslobj # type: ignore + if info == "client_addr": + return self._sock.getsockname() + if info == "server_addr": + return self._sock.getpeername() + if info == "socket": + return self._sock + if info == "is_readable": + return is_socket_readable(self._sock) + return None + + class TLSinTLSStream(NetworkStream): # pragma: no cover """ Because the standard `SSLContext.wrap_socket` method does @@ -213,6 +263,23 @@ def connect_tcp( sock.setsockopt(socket.IPPROTO_TCP, socket.TCP_NODELAY, 1) return SyncStream(sock) + def connect_udp( + self, + host: str, + port: int, + ) -> NetworkStream: + infos = socket.getaddrinfo(host, port, type=socket.SOCK_DGRAM) + addr: typing.Any = infos[0][4] + + if len(addr) == 2: + addr = ("::ffff:" + addr[0], addr[1], 0, 0) + + sock = socket.socket(socket.AF_INET6, socket.SOCK_DGRAM) + sock.setsockopt(socket.IPPROTO_IPV6, socket.IPV6_V6ONLY, 0) + sock.bind(("::", 0, 0, 0)) + + return SyncUDPStream(sock=sock, addr=addr) + def connect_unix_socket( self, path: str, diff --git a/httpcore/_sync/__init__.py b/httpcore/_sync/__init__.py index b476d76d..30e47bce 100644 --- a/httpcore/_sync/__init__.py +++ b/httpcore/_sync/__init__.py @@ -16,6 +16,18 @@ def __init__(self, *args, **kwargs) -> None: # type: ignore ) +try: + from .http3 import HTTP3Connection +except ImportError: # pragma: nocover + + class HTTP3Connection: # type: ignore + def __init__(self, *args, **kwargs) -> None: # type: ignore + raise RuntimeError( + "Attempted to use http3 support, but the `aioquic` package is not " + "installed. Use 'pip install httpcore[http3]'." + ) + + try: from .socks_proxy import SOCKSProxy except ImportError: # pragma: nocover @@ -34,6 +46,7 @@ def __init__(self, *args, **kwargs) -> None: # type: ignore "HTTPProxy", "HTTP11Connection", "HTTP2Connection", + "HTTP3Connection", "ConnectionInterface", "SOCKSProxy", ] diff --git a/httpcore/_sync/connection.py b/httpcore/_sync/connection.py index c3890f34..d1a16940 100644 --- a/httpcore/_sync/connection.py +++ b/httpcore/_sync/connection.py @@ -41,6 +41,7 @@ def __init__( keepalive_expiry: Optional[float] = None, http1: bool = True, http2: bool = False, + http3: bool = False, retries: int = 0, local_address: Optional[str] = None, uds: Optional[str] = None, @@ -52,6 +53,7 @@ def __init__( self._keepalive_expiry = keepalive_expiry self._http1 = http1 self._http2 = http2 + self._http3 = http3 self._retries = retries self._local_address = local_address self._uds = uds @@ -80,7 +82,18 @@ def handle_request(self, request: Request) -> Response: ssl_object is not None and ssl_object.selected_alpn_protocol() == "h2" ) - if http2_negotiated or (self._http2 and not self._http1): + if self._http3 and not ( + self._http1 or self._http2 + ): # pragma: no cover + from .http3 import HTTP3Connection + + stream = self._connect_http3(request) + self._connection = HTTP3Connection( + origin=self._origin, + stream=stream, + keepalive_expiry=self._keepalive_expiry, + ) + elif http2_negotiated or (self._http2 and not self._http1): from .http2 import HTTP2Connection self._connection = HTTP2Connection( @@ -162,6 +175,30 @@ def _connect(self, request: Request) -> NetworkStream: with Trace("retry", logger, request, kwargs) as trace: self._network_backend.sleep(delay) + def _connect_http3( + self, request: Request + ) -> NetworkStream: # pragma: nocover + retries_left = self._retries + delays = exponential_backoff(factor=RETRIES_BACKOFF_FACTOR) + + while True: + try: + kwargs = { + "host": self._origin.host.decode("ascii"), + "port": self._origin.port, + } + with Trace("connect_udp", logger, request, kwargs) as trace: + stream = self._network_backend.connect_udp(**kwargs) # type: ignore + trace.return_value = stream + return stream + except (ConnectError, ConnectTimeout): + if retries_left <= 0: + raise + retries_left -= 1 + delay = next(delays) + with Trace("retry", logger, request, kwargs) as trace: + self._network_backend.sleep(delay) + def can_handle_request(self, origin: Origin) -> bool: return origin == self._origin diff --git a/httpcore/_sync/connection_pool.py b/httpcore/_sync/connection_pool.py index 01bec59e..8264e107 100644 --- a/httpcore/_sync/connection_pool.py +++ b/httpcore/_sync/connection_pool.py @@ -53,6 +53,7 @@ def __init__( keepalive_expiry: Optional[float] = None, http1: bool = True, http2: bool = False, + http3: bool = False, retries: int = 0, local_address: Optional[str] = None, uds: Optional[str] = None, @@ -77,6 +78,8 @@ def __init__( by the connection pool. Defaults to True. http2: A boolean indicating if HTTP/2 requests should be supported by the connection pool. Defaults to False. + http3: A boolean indicating if HTTP/3 requests should be supported by + the connection pool. Defaults to False. retries: The maximum number of retries when trying to establish a connection. local_address: Local address to connect from. Can also be used to connect @@ -105,6 +108,7 @@ def __init__( self._keepalive_expiry = keepalive_expiry self._http1 = http1 self._http2 = http2 + self._http3 = http3 self._retries = retries self._local_address = local_address self._uds = uds @@ -131,6 +135,7 @@ def create_connection(self, origin: Origin) -> ConnectionInterface: keepalive_expiry=self._keepalive_expiry, http1=self._http1, http2=self._http2, + http3=self._http3, retries=self._retries, local_address=self._local_address, uds=self._uds, diff --git a/httpcore/_sync/http3.py b/httpcore/_sync/http3.py new file mode 100644 index 00000000..a0fe8292 --- /dev/null +++ b/httpcore/_sync/http3.py @@ -0,0 +1,497 @@ +import enum +import logging +import time +import types +import typing +from time import monotonic + +import certifi +from aioquic.h3 import events as h3_events, exceptions as h3_exceptions +from aioquic.h3.connection import H3Connection +from aioquic.quic import events as quic_events +from aioquic.quic.configuration import QuicConfiguration +from aioquic.quic.connection import QuicConnection, QuicConnectionState + +from .._backends.base import NetworkStream +from .._exceptions import ( + ConnectionNotAvailable, + LocalProtocolError, + RemoteProtocolError, +) +from .._models import Origin, Request, Response +from .._synchronization import Lock, ShieldCancellation +from .._trace import Trace +from .interfaces import ConnectionInterface + +logger = logging.getLogger("httpcore.http3") + + +def has_body_headers(request: Request) -> bool: + return any( + k.lower() == b"content-length" or k.lower() == b"transfer-encoding" + for k, v in request.headers + ) + + +class HTTPConnectionState(enum.IntEnum): + ACTIVE = 1 + IDLE = 2 + CLOSED = 3 + + +class HTTP3Connection(ConnectionInterface): + READ_NUM_BYTES = 64 * 1024 + + def __init__( + self, + origin: Origin, + stream: NetworkStream, + keepalive_expiry: typing.Optional[float] = None, + ): + quic_configuration = QuicConfiguration( + alpn_protocols=["h3", "h3-32", "h3-31", "h3-30", "h3-29"], + is_client=True, + ) + quic_configuration.server_name = origin.host.decode("ascii") + quic_configuration.cafile = certifi.where() + + self._origin = origin + self._network_stream = stream + self._keepalive_expiry: typing.Optional[float] = keepalive_expiry + self._quic_conn = QuicConnection(configuration=quic_configuration) + self._h3_state = H3Connection(quic=self._quic_conn) + self._state = HTTPConnectionState.IDLE + self._expire_at: typing.Optional[float] = None + self._request_count = 0 + self._state_lock = Lock() + self._read_lock = Lock() + self._write_lock = Lock() + self._handshake_lock = Lock() + self._handshake_done = False + self._sent_connection_init = False + self._used_all_stream_ids = False + self._connection_error = False + + # Mapping from stream ID to response stream events. + self._events: typing.Dict[ + int, + typing.Union[ + h3_events.ResponseReceived, + h3_events.DataReceived, + quic_events.StreamReset, + ], + ] = {} + + # Connection terminated events are stored as state since + # we need to handle them for all streams. + self._connection_terminated: typing.Optional[ + quic_events.ConnectionTerminated + ] = None + + self._read_exception: typing.Optional[Exception] = None + self._write_exception: typing.Optional[Exception] = None + + def handle_request(self, request: Request) -> Response: + if not self.can_handle_request(request.url.origin): + # This cannot occur in normal operation, since the connection pool + # will only send requests on connections that handle them. + # It's in place simply for resilience as a guard against incorrect + # usage, for anyone working directly with httpcore connections. + raise RuntimeError( + f"Attempted to send request to {request.url.origin} on connection " + f"to {self._origin}" + ) + + with self._state_lock: + if self._state in (HTTPConnectionState.ACTIVE, HTTPConnectionState.IDLE): + self._request_count += 1 + self._expire_at = None + self._state = HTTPConnectionState.ACTIVE + else: + raise ConnectionNotAvailable() + + with self._handshake_lock: + if not self._handshake_done: + self._do_handshake(request) + + try: + stream_id = self._quic_conn.get_next_available_stream_id() + self._events[stream_id] = [] + except BaseException: # pragma: nocover + assert False, "Unexpected exception" + + try: + kwargs = {"request": request, "stream_id": stream_id} + with Trace("send_request_headers", logger, request, kwargs): + self._send_request_headers(request=request, stream_id=stream_id) + with Trace("send_request_body", logger, request, kwargs): + self._send_request_body(request=request, stream_id=stream_id) + with Trace( + "receive_response_headers", logger, request, kwargs + ) as trace: + status, headers, stream_ended = self._receive_response( + request=request, stream_id=stream_id + ) + trace.return_value = (status, headers) + + return Response( + status=status, + headers=headers, + content=HTTP3ConnectionByteStream( + self, request, stream_id=stream_id, is_empty=stream_ended + ), + extensions={ + "http_version": b"HTTP/3", + "network_stream": self._network_stream, + "stream_id": stream_id, + }, + ) + except BaseException as exc: # noqa: PIE786 + with ShieldCancellation(): + kwargs = {"stream_id": stream_id} + with Trace("response_closed", logger, request, kwargs): + self._response_closed(stream_id=stream_id) + + if isinstance(exc, h3_exceptions.H3Error): + if self._connection_terminated: # pragma: nocover + raise RemoteProtocolError(self._connection_terminated) + raise LocalProtocolError(exc) # pragma: nocover + + raise exc + + # Sending the request... + + def _do_handshake(self, request: Request) -> None: + assert hasattr(self._network_stream, "_addr") + self._quic_conn.connect(addr=self._network_stream._addr, now=monotonic()) + while not self._handshake_done: + self._write_outgoing_data(request) + self._read_incoming_data(request) + + def _send_request_headers(self, request: Request, stream_id: int) -> None: + """ + Send the request headers to a given stream ID. + """ + end_stream = not has_body_headers(request) + + # In HTTP/3 the ':authority' pseudo-header is used instead of 'Host'. + # In order to gracefully handle HTTP/1.1 and HTTP/3 we always require + # HTTP/1.1 style headers, and map them appropriately if we end up on + # an HTTP/3 connection. + authority = [v for k, v in request.headers if k.lower() == b"host"][0] + + headers = [ + (b":method", request.method), + (b":authority", authority), + (b":scheme", request.url.scheme), + (b":path", request.url.target), + ] + [ + (k.lower(), v) + for k, v in request.headers + if k.lower() + not in ( + b"host", + b"transfer-encoding", + ) + ] + + self._h3_state.send_headers(stream_id, headers, end_stream=end_stream) + self._write_outgoing_data(request) + + def _send_request_body(self, request: Request, stream_id: int) -> None: + """ + Iterate over the request body sending it to a given stream ID. + """ + if not has_body_headers(request): + return + + assert isinstance(request.stream, typing.Iterable) + for data in request.stream: + self._send_stream_data(request, stream_id, data) + self._send_end_stream(request, stream_id) + + def _send_stream_data( + self, request: Request, stream_id: int, data: bytes + ) -> None: + """ + Send a single chunk of data in one or more data frames. + """ + self._h3_state.send_data(stream_id=stream_id, data=data, end_stream=False) + self._write_outgoing_data(request) + + def _send_end_stream(self, request: Request, stream_id: int) -> None: + """ + Send an empty data frame on on a given stream ID with the END_STREAM flag set. + """ + self._h3_state.send_data(stream_id=stream_id, data=b"", end_stream=True) + self._write_outgoing_data(request) + + # Receiving the response... + + def _receive_response( + self, request: Request, stream_id: int + ) -> typing.Tuple[int, typing.List[typing.Tuple[bytes, bytes]]]: + """ + Return the response status code and headers for a given stream ID. + """ + while True: + event = self._receive_stream_event(request, stream_id) + if isinstance(event, h3_events.HeadersReceived): + break + + status_code = 200 + headers = [] + for k, v in event.headers: + if k == b":status": + status_code = int(v.decode("ascii", errors="ignore")) + elif not k.startswith(b":"): + headers.append((k, v)) + + return (status_code, headers, event.stream_ended) + + def _receive_response_body( + self, request: Request, stream_id: int + ) -> typing.Iterator[bytes]: + """ + Iterator that returns the bytes of the response body for a given stream ID. + """ + while True: + event = self._receive_stream_event(request, stream_id) + if isinstance(event, h3_events.DataReceived): + if event.stream_ended: + break + + self._write_outgoing_data(request) + yield event.data + + def _receive_stream_event( + self, request: Request, stream_id: int + ) -> typing.Union[h3_events.HeadersReceived, h3_events.DatagramReceived]: + """ + Return the next available event for a given stream ID. + + Will read more data from the network if required. + """ + while not self._events.get(stream_id): + self._receive_events(request, stream_id) + event = self._events[stream_id].pop(0) + if isinstance(event, quic_events.StreamReset): + raise RemoteProtocolError(event) + return event + + def _receive_events( + self, request: Request, stream_id: typing.Optional[int] = None + ) -> None: + """ + Read some data from the network until we see one or more events + for a given stream ID. + """ + + with self._read_lock: + if self._connection_terminated is not None: + raise RemoteProtocolError(self._connection_terminated) + + # This conditional is a bit icky. We don't want to block reading if we've + # actually got an event to return for a given stream. We need to do that + # check *within* the atomic read lock. + if stream_id is None or not self._events.get(stream_id): + events = self._read_incoming_data(request) + for event in events: + if isinstance( + event, + ( + h3_events.HeadersReceived, + h3_events.DataReceived, + ), + ): + if event.stream_id in self._events: + self._events[event.stream_id].append(event) + + elif isinstance(event, quic_events.ConnectionTerminated): + self._connection_terminated = event + + self._write_outgoing_data(request) + + def _response_closed(self, stream_id: int) -> None: + del self._events[stream_id] + with self._state_lock: + if self._connection_terminated and not self._events: + self.close() + + elif self._state == HTTPConnectionState.ACTIVE and not self._events: + self._state = HTTPConnectionState.IDLE + if self._keepalive_expiry is not None: + now = time.monotonic() + self._expire_at = now + self._keepalive_expiry + if self._used_all_stream_ids: # pragma: nocover + self.close() + + def close(self) -> None: + # Note that this method unilaterally closes the connection, and does + # not have any kind of locking in place around it. + self._quic_conn.close() + self._state = HTTPConnectionState.CLOSED + self._network_stream.close() + + # Wrappers around network read/write operations... + + def _read_incoming_data( + self, request: Request + ) -> typing.List[h3_events.H3Event]: + timeouts = request.extensions.get("timeout", {}) + timeout = timeouts.get("read", None) + + if self._read_exception is not None: + raise self._read_exception # pragma: nocover + + try: + data = self._network_stream.read(self.READ_NUM_BYTES, timeout) + if data == b"": + raise RemoteProtocolError("Server disconnected") + except Exception as exc: + # If we get a network error we should: + # + # 1. Save the exception and just raise it immediately on any future reads. + # (For example, this means that a single read timeout or disconnect will + # immediately close all pending streams. Without requiring multiple + # sequential timeouts.) + # 2. Mark the connection as errored, so that we don't accept any other + # incoming requests. + self._read_exception = exc + self._connection_error = True + raise exc + + self._quic_conn.receive_datagram( + data=data, addr=self._network_stream._addr, now=time.monotonic() + ) + + events: typing.List[h3_events.H3Event] = [] + quic_event = self._quic_conn.next_event() + + while quic_event: + if isinstance(quic_event, quic_events.HandshakeCompleted): + self._handshake_done = True + + # elif isinstance(quic_event, quic_events.StreamDataReceived): + + events.extend(self._h3_state.handle_event(quic_event)) + quic_event = self._quic_conn.next_event() + + return events + + def _write_outgoing_data(self, request: Request) -> None: + timeouts = request.extensions.get("timeout", {}) + timeout = timeouts.get("write", None) + + with self._write_lock: + for data_to_send, _ in self._quic_conn.datagrams_to_send(now=monotonic()): + if self._write_exception is not None: + raise self._write_exception # pragma: nocover + + try: + self._network_stream.write(data_to_send, timeout) + except Exception as exc: # pragma: nocover + # If we get a network error we should: + # + # 1. Save the exception and just raise it immediately on any future write. + # (For example, this means that a single write timeout or disconnect will + # immediately close all pending streams. Without requiring multiple + # sequential timeouts.) + # 2. Mark the connection as errored, so that we don't accept any other + # incoming requests. + self._write_exception = exc + self._connection_error = True + raise exc + + # Interface for connection pooling... + + def can_handle_request(self, origin: Origin) -> bool: + return origin == self._origin + + def is_available(self) -> bool: + return ( + self._state != HTTPConnectionState.CLOSED + and not self._connection_error + and not self._used_all_stream_ids + and not (self._quic_conn._state == QuicConnectionState.CLOSING) + ) + + def has_expired(self) -> bool: + now = time.monotonic() + return self._expire_at is not None and now > self._expire_at + + def is_idle(self) -> bool: + return self._state == HTTPConnectionState.IDLE + + def is_closed(self) -> bool: + return self._state == HTTPConnectionState.CLOSED + + def info(self) -> str: + origin = str(self._origin) + return ( + f"{origin!r}, HTTP/3, {self._state.name}, " + f"Request Count: {self._request_count}" + ) + + def __repr__(self) -> str: + class_name = self.__class__.__name__ + origin = str(self._origin) + return ( + f"<{class_name} [{origin!r}, {self._state.name}, " + f"Request Count: {self._request_count}]>" + ) + + # These context managers are not used in the standard flow, but are + # useful for testing or working with connection instances directly. + + def __enter__(self) -> "HTTP3Connection": + return self + + def __exit__( + self, + exc_type: typing.Optional[typing.Type[BaseException]] = None, + exc_value: typing.Optional[BaseException] = None, + traceback: typing.Optional[types.TracebackType] = None, + ) -> None: + self.close() + + +class HTTP3ConnectionByteStream: + def __init__( + self, + connection: HTTP3Connection, + request: Request, + stream_id: int, + is_empty: bool, + ) -> None: + self._connection = connection + self._request = request + self._stream_id = stream_id + self._closed = False + self._is_empty = is_empty + + def __iter__(self) -> typing.Iterator[bytes]: + kwargs = {"request": self._request, "stream_id": self._stream_id} + try: + if not self._is_empty: + with Trace( + "receive_response_body", logger, self._request, kwargs + ): + for chunk in self._connection._receive_response_body( + request=self._request, stream_id=self._stream_id + ): + yield chunk + except BaseException as exc: + # If we get an exception while streaming the response, + # we want to close the response (and possibly the connection) + # before raising that exception. + with ShieldCancellation(): + self.close() + raise exc + + def close(self) -> None: + if not self._closed: + self._closed = True + kwargs = {"stream_id": self._stream_id} + with Trace("response_closed", logger, self._request, kwargs): + self._connection._response_closed(stream_id=self._stream_id) diff --git a/pyproject.toml b/pyproject.toml index 85c78740..279253ce 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -37,6 +37,11 @@ dependencies = [ http2 = [ "h2>=3,<5", ] + +http3 = [ + "aioquic>=0.9.21", +] + socks = [ "socksio==1.*", ] @@ -73,6 +78,7 @@ path = "README.md" path = "CHANGELOG.md" [tool.mypy] +exclude = ['httpcore/_async/http3', 'httpcore/_sync/http3'] strict = true show_error_codes = true @@ -97,7 +103,10 @@ filterwarnings = ["error"] [tool.coverage.run] omit = [ "venv/*", - "httpcore/_sync/*" + "httpcore/_sync/*", + "httpcore/_async/http3.py", + "httpcore/_backends/sync.py", + ] include = ["httpcore/*", "tests/*"] diff --git a/requirements.txt b/requirements.txt index ba947170..dbbc166d 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,4 +1,4 @@ --e .[asyncio,trio,http2,socks] +-e .[asyncio,trio,http2,http3,socks] # Docs mkdocs==1.6.0