626 lines
19 KiB
Python
Raw Permalink Normal View History

2025-03-18 00:17:27 +05:30
# -*- coding: utf-8 -*-
"""
hyperframe/frame
~~~~~~~~~~~~~~~~
Defines framing logic for HTTP/2. Provides both classes to represent framed
data and logic for aiding the connection when it comes to reading from the
socket.
"""
import collections
import struct
from .flags import Flag, Flags
# The maximum initial length of a frame. Some frames have shorter maximum lengths.
FRAME_MAX_LEN = (2 ** 14)
# The maximum allowed length of a frame.
FRAME_MAX_ALLOWED_LEN = (2 ** 24) - 1
class Frame(object):
"""
The base class for all HTTP/2 frames.
"""
# The flags defined on this type of frame.
defined_flags = []
# The type of the frame.
type = None
# If 'has-stream', the frame's stream_id must be non-zero. If 'no-stream',
# it must be zero. If 'either', it's not checked.
stream_association = None
def __init__(self, stream_id, flags=()):
self.stream_id = stream_id
self.flags = Flags(self.defined_flags)
self.body_len = 0
for flag in flags:
self.flags.add(flag)
if self.stream_association == 'has-stream' and not self.stream_id:
raise ValueError('Stream ID must be non-zero')
if self.stream_association == 'no-stream' and self.stream_id:
raise ValueError('Stream ID must be zero')
def __repr__(self):
flags = ", ".join(self.flags) or "None"
body = self.serialize_body()
if len(body) > 100:
body = str(body[:100]) + "..."
return (
"{type}(Stream: {stream}; Flags: {flags}): {body}"
).format(type=type(self).__name__, stream=self.stream_id, flags=flags, body=body)
@staticmethod
def parse_frame_header(header):
"""
Takes a 9-byte frame header and returns a tuple of the appropriate
Frame object and the length that needs to be read from the socket.
"""
fields = struct.unpack("!HBBBL", header)
# First 24 bits are frame length.
length = (fields[0] << 8) + fields[1]
type = fields[2]
flags = fields[3]
stream_id = fields[4]
if type not in FRAMES:
raise ValueError("Unknown frame type %d" % type)
frame = FRAMES[type](stream_id)
frame.parse_flags(flags)
return (frame, length)
def parse_flags(self, flag_byte):
for flag, flag_bit in self.defined_flags:
if flag_byte & flag_bit:
self.flags.add(flag)
return self.flags
def serialize(self):
body = self.serialize_body()
self.body_len = len(body)
# Build the common frame header.
# First, get the flags.
flags = 0
for flag, flag_bit in self.defined_flags:
if flag in self.flags:
flags |= flag_bit
header = struct.pack(
"!HBBBL",
(self.body_len & 0xFFFF00) >> 8, # Length is spread over top 24 bits
self.body_len & 0x0000FF,
self.type,
flags,
self.stream_id & 0x7FFFFFFF # Stream ID is 32 bits.
)
return header + body
def serialize_body(self):
raise NotImplementedError()
def parse_body(self, data):
raise NotImplementedError()
class Padding(object):
"""
Mixin for frames that contain padding.
"""
def __init__(self, stream_id, pad_length=0, **kwargs):
super(Padding, self).__init__(stream_id, **kwargs)
self.pad_length = pad_length
def serialize_padding_data(self):
if 'PADDED' in self.flags:
return struct.pack('!B', self.pad_length)
return b''
def parse_padding_data(self, data):
if 'PADDED' in self.flags:
self.pad_length = struct.unpack('!B', data[:1])[0]
return 1
return 0
@property
def total_padding(self):
"""Return the total length of the padding, if any."""
return self.pad_length
class Priority(object):
"""
Mixin for frames that contain priority data.
"""
def __init__(self, stream_id, depends_on=None, stream_weight=None, exclusive=None, **kwargs):
super(Priority, self).__init__(stream_id, **kwargs)
# The stream ID of the stream on which this stream depends.
self.depends_on = depends_on
# The weight of the stream. This is an integer between 0 and 256.
self.stream_weight = stream_weight
# Whether the exclusive bit was set.
self.exclusive = exclusive
def serialize_priority_data(self):
return struct.pack(
"!LB",
self.depends_on | (int(self.exclusive) << 31),
self.stream_weight
)
def parse_priority_data(self, data):
MASK = 0x80000000
self.depends_on, self.stream_weight = struct.unpack(
"!LB", data[:5]
)
self.exclusive = bool(self.depends_on & MASK)
self.depends_on &= ~MASK
return 5
class DataFrame(Padding, Frame):
"""
DATA frames convey arbitrary, variable-length sequences of octets
associated with a stream. One or more DATA frames are used, for instance,
to carry HTTP request or response payloads.
"""
defined_flags = [
Flag('END_STREAM', 0x01),
Flag('PADDED', 0x08),
]
type = 0x0
stream_association = 'has-stream'
def __init__(self, stream_id, data=b'', **kwargs):
super(DataFrame, self).__init__(stream_id, **kwargs)
self.data = data
def serialize_body(self):
padding_data = self.serialize_padding_data()
padding = b'\0' * self.total_padding
return b''.join([padding_data, self.data, padding])
def parse_body(self, data):
padding_data_length = self.parse_padding_data(data)
self.data = data[padding_data_length:len(data)-self.total_padding].tobytes()
self.body_len = len(data)
@property
def flow_controlled_length(self):
"""
If the frame is padded we need to include the padding length byte in
the flow control used.
"""
padding_len = self.total_padding + 1 if self.total_padding else 0
return len(self.data) + padding_len
class PriorityFrame(Priority, Frame):
"""
The PRIORITY frame specifies the sender-advised priority of a stream. It
can be sent at any time for an existing stream. This enables
reprioritisation of existing streams.
"""
defined_flags = []
type = 0x02
stream_association = 'has-stream'
def serialize_body(self):
return self.serialize_priority_data()
def parse_body(self, data):
self.parse_priority_data(data)
self.body_len = len(data)
class RstStreamFrame(Frame):
"""
The RST_STREAM frame allows for abnormal termination of a stream. When sent
by the initiator of a stream, it indicates that they wish to cancel the
stream or that an error condition has occurred. When sent by the receiver
of a stream, it indicates that either the receiver is rejecting the stream,
requesting that the stream be cancelled or that an error condition has
occurred.
"""
defined_flags = []
type = 0x03
stream_association = 'has-stream'
def __init__(self, stream_id, error_code=0, **kwargs):
super(RstStreamFrame, self).__init__(stream_id, **kwargs)
self.error_code = error_code
def serialize_body(self):
return struct.pack("!L", self.error_code)
def parse_body(self, data):
if len(data) != 4:
raise ValueError()
self.error_code = struct.unpack("!L", data)[0]
self.body_len = len(data)
class SettingsFrame(Frame):
"""
The SETTINGS frame conveys configuration parameters that affect how
endpoints communicate. The parameters are either constraints on peer
behavior or preferences.
Settings are not negotiated. Settings describe characteristics of the
sending peer, which are used by the receiving peer. Different values for
the same setting can be advertised by each peer. For example, a client
might set a high initial flow control window, whereas a server might set a
lower value to conserve resources.
"""
defined_flags = [Flag('ACK', 0x01)]
type = 0x04
stream_association = 'no-stream'
# We need to define the known settings, they may as well be class
# attributes.
HEADER_TABLE_SIZE = 0x01
ENABLE_PUSH = 0x02
MAX_CONCURRENT_STREAMS = 0x03
INITIAL_WINDOW_SIZE = 0x04
SETTINGS_MAX_FRAME_SIZE = 0x05
SETTINGS_MAX_HEADER_LIST_SIZE = 0x06
def __init__(self, stream_id=0, settings=None, **kwargs):
super(SettingsFrame, self).__init__(stream_id, **kwargs)
if settings and "ACK" in kwargs.get("flags", ()):
raise ValueError("Settings must be empty if ACK flag is set.")
# A dictionary of the setting type byte to the value.
self.settings = settings or {}
def serialize_body(self):
settings = [struct.pack("!HL", setting & 0xFF, value)
for setting, value in self.settings.items()]
return b''.join(settings)
def parse_body(self, data):
for i in range(0, len(data), 6):
name, value = struct.unpack("!HL", data[i:i+6])
self.settings[name] = value
self.body_len = len(data)
class PushPromiseFrame(Padding, Frame):
"""
The PUSH_PROMISE frame is used to notify the peer endpoint in advance of
streams the sender intends to initiate.
"""
defined_flags = [
Flag('END_HEADERS', 0x04),
Flag('PADDED', 0x08)
]
type = 0x05
stream_association = 'has-stream'
def __init__(self, stream_id, promised_stream_id=0, data=b'', **kwargs):
super(PushPromiseFrame, self).__init__(stream_id, **kwargs)
self.promised_stream_id = promised_stream_id
self.data = data
def serialize_body(self):
padding_data = self.serialize_padding_data()
padding = b'\0' * self.total_padding
data = struct.pack("!L", self.promised_stream_id)
return b''.join([padding_data, data, self.data, padding])
def parse_body(self, data):
padding_data_length = self.parse_padding_data(data)
self.promised_stream_id = struct.unpack("!L", data[padding_data_length:padding_data_length + 4])[0]
self.data = data[padding_data_length + 4:].tobytes()
self.body_len = len(data)
class PingFrame(Frame):
"""
The PING frame is a mechanism for measuring a minimal round-trip time from
the sender, as well as determining whether an idle connection is still
functional. PING frames can be sent from any endpoint.
"""
defined_flags = [Flag('ACK', 0x01)]
type = 0x06
stream_association = 'no-stream'
def __init__(self, stream_id=0, opaque_data=b'', **kwargs):
super(PingFrame, self).__init__(stream_id, **kwargs)
self.opaque_data = opaque_data
def serialize_body(self):
if len(self.opaque_data) > 8:
raise ValueError()
data = self.opaque_data
data += b'\x00' * (8 - len(self.opaque_data))
return data
def parse_body(self, data):
if len(data) > 8:
raise ValueError()
self.opaque_data = data.tobytes()
self.body_len = len(data)
class GoAwayFrame(Frame):
"""
The GOAWAY frame informs the remote peer to stop creating streams on this
connection. It can be sent from the client or the server. Once sent, the
sender will ignore frames sent on new streams for the remainder of the
connection.
"""
type = 0x07
stream_association = 'no-stream'
def __init__(self, stream_id=0, last_stream_id=0, error_code=0, additional_data=b'', **kwargs):
super(GoAwayFrame, self).__init__(stream_id, **kwargs)
self.last_stream_id = last_stream_id
self.error_code = error_code
self.additional_data = additional_data
def serialize_body(self):
data = struct.pack(
"!LL",
self.last_stream_id & 0x7FFFFFFF,
self.error_code
)
data += self.additional_data
return data
def parse_body(self, data):
self.last_stream_id, self.error_code = struct.unpack("!LL", data[:8])
self.body_len = len(data)
if len(data) > 8:
self.additional_data = data[8:].tobytes()
class WindowUpdateFrame(Frame):
"""
The WINDOW_UPDATE frame is used to implement flow control.
Flow control operates at two levels: on each individual stream and on the
entire connection.
Both types of flow control are hop by hop; that is, only between the two
endpoints. Intermediaries do not forward WINDOW_UPDATE frames between
dependent connections. However, throttling of data transfer by any receiver
can indirectly cause the propagation of flow control information toward the
original sender.
"""
type = 0x08
stream_association = 'either'
def __init__(self, stream_id, window_increment=0, **kwargs):
super(WindowUpdateFrame, self).__init__(stream_id, **kwargs)
self.window_increment = window_increment
def serialize_body(self):
return struct.pack("!L", self.window_increment & 0x7FFFFFFF)
def parse_body(self, data):
self.window_increment = struct.unpack("!L", data)[0]
self.body_len = len(data)
class HeadersFrame(Padding, Priority, Frame):
"""
The HEADERS frame carries name-value pairs. It is used to open a stream.
HEADERS frames can be sent on a stream in the "open" or "half closed
(remote)" states.
The HeadersFrame class is actually basically a data frame in this
implementation, because of the requirement to control the sizes of frames.
A header block fragment that doesn't fit in an entire HEADERS frame needs
to be followed with CONTINUATION frames. From the perspective of the frame
building code the header block is an opaque data segment.
"""
type = 0x01
stream_association = 'has-stream'
defined_flags = [
Flag('END_STREAM', 0x01),
Flag('END_HEADERS', 0x04),
Flag('PADDED', 0x08),
Flag('PRIORITY', 0x20),
]
def __init__(self, stream_id, data=b'', **kwargs):
super(HeadersFrame, self).__init__(stream_id, **kwargs)
self.data = data
def serialize_body(self):
padding_data = self.serialize_padding_data()
padding = b'\0' * self.total_padding
if 'PRIORITY' in self.flags:
priority_data = self.serialize_priority_data()
else:
priority_data = b''
return b''.join([padding_data, priority_data, self.data, padding])
def parse_body(self, data):
padding_data_length = self.parse_padding_data(data)
data = data[padding_data_length:]
if 'PRIORITY' in self.flags:
priority_data_length = self.parse_priority_data(data)
else:
priority_data_length = 0
self.body_len = len(data)
self.data = data[priority_data_length:len(data)-self.total_padding].tobytes()
class ContinuationFrame(Frame):
"""
The CONTINUATION frame is used to continue a sequence of header block
fragments. Any number of CONTINUATION frames can be sent on an existing
stream, as long as the preceding frame on the same stream is one of
HEADERS, PUSH_PROMISE or CONTINUATION without the END_HEADERS flag set.
Much like the HEADERS frame, hyper treats this as an opaque data frame with
different flags and a different type.
"""
type = 0x09
stream_association = 'has-stream'
defined_flags = [Flag('END_HEADERS', 0x04),]
def __init__(self, stream_id, data=b'', **kwargs):
super(ContinuationFrame, self).__init__(stream_id, **kwargs)
self.data = data
def serialize_body(self):
return self.data
def parse_body(self, data):
self.data = data.tobytes()
self.body_len = len(data)
Origin = collections.namedtuple('Origin', ['scheme', 'host', 'port'])
class AltSvcFrame(Frame):
"""
The ALTSVC frame is used to advertise alternate services that the current
host, or a different one, can understand.
"""
type = 0xA
stream_association = 'no-stream'
def __init__(self, stream_id=0, host=b'', port=0, protocol_id=b'', max_age=0, origin=None, **kwargs):
super(AltSvcFrame, self).__init__(stream_id, **kwargs)
self.host = host
self.port = port
self.protocol_id = protocol_id
self.max_age = max_age
self.origin = origin
def serialize_origin(self):
if self.origin is not None:
if self.origin.port is None:
hostport = self.origin.host
else:
hostport = self.origin.host + b':' + str(self.origin.port).encode('ascii')
return self.origin.scheme + b'://' + hostport
return b''
def parse_origin(self, data):
if len(data) > 0:
data = data.tobytes()
scheme, hostport = data.split(b'://')
host, _, port = hostport.partition(b':')
self.origin = Origin(scheme=scheme, host=host,
port=int(port) if len(port) > 0 else None)
def serialize_body(self):
first = struct.pack("!LHxB", self.max_age, self.port, len(self.protocol_id))
host_length = struct.pack("!B", len(self.host))
return b''.join([first, self.protocol_id, host_length, self.host,
self.serialize_origin()])
def parse_body(self, data):
self.body_len = len(data)
self.max_age, self.port, protocol_id_length = struct.unpack("!LHxB", data[:8])
pos = 8
self.protocol_id = data[pos:pos+protocol_id_length].tobytes()
pos += protocol_id_length
host_length = struct.unpack("!B", data[pos:pos+1])[0]
pos += 1
self.host = data[pos:pos+host_length].tobytes()
pos += host_length
self.parse_origin(data[pos:])
class BlockedFrame(Frame):
"""
The BLOCKED frame indicates that the sender is unable to send data due to a
closed flow control window.
The BLOCKED frame is used to provide feedback about the performance of flow
control for the purposes of performance tuning and debugging. The BLOCKED
frame can be sent by a peer when flow controlled data cannot be sent due to
the connection- or stream-level flow control. This frame MUST NOT be sent
if there are other reasons preventing data from being sent, either a lack
of available data, or the underlying transport being blocked.
"""
type = 0x0B
stream_association = 'both'
defined_flags = []
def serialize_body(self):
return b''
def parse_body(self, data):
pass
# A map of type byte to frame class.
_FRAME_CLASSES = [
DataFrame,
HeadersFrame,
PriorityFrame,
RstStreamFrame,
SettingsFrame,
PushPromiseFrame,
PingFrame,
GoAwayFrame,
WindowUpdateFrame,
ContinuationFrame,
AltSvcFrame,
BlockedFrame
]
FRAMES = {cls.type: cls for cls in _FRAME_CLASSES}