369 lines
14 KiB
Python
369 lines
14 KiB
Python
|
from __future__ import absolute_import
|
||
|
|
||
|
from base64 import b64encode
|
||
|
from hashlib import sha1
|
||
|
from mimetools import Message
|
||
|
from netlib import tcp
|
||
|
from netlib import utils
|
||
|
from StringIO import StringIO
|
||
|
import os
|
||
|
import SocketServer
|
||
|
import struct
|
||
|
import io
|
||
|
|
||
|
# Collection of utility functions that implement small portions of the RFC6455 WebSockets protocol.
|
||
|
# Useful for building WebSocket clients and servers.
|
||
|
#
|
||
|
# Emphasis is on readability, simplicity and modularity, not performance or completeness.
|
||
|
#
|
||
|
# This is a work in progress and does not yet contain all the utilities needed to create fully compliant clients/servers.
|
||
|
#
|
||
|
# Spec: https://tools.ietf.org/html/rfc6455
|
||
|
|
||
|
# The magic string that websocket servers must know to prove they understand RFC6455.
# create_server_handshake() appends it to the client's key before hashing.
websockets_magic = '258EAFA5-E914-47DA-95CA-C5AB0DC85B11'
|
||
|
|
||
|
class WebSocketFrameValidationException(Exception):
    """Raised when a WebSocketsFrame fails its validate_frame() checks."""
|
||
|
|
||
|
class WebSocketsFrame(object):
    """
    Represents one websockets frame.

    The constructor takes human readable forms of the frame components.
    from_bytes() and from_byte_stream() build a frame from its wire format,
    and to_bytes() serializes it back.

    WebSockets Frame as defined in RFC6455

      0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
     +-+-+-+-+-------+-+-------------+-------------------------------+
     |F|R|R|R| opcode|M| Payload len |    Extended payload length    |
     |I|S|S|S|  (4)  |A|     (7)     |             (16/64)           |
     |N|V|V|V|       |S|             |   (if payload len==126/127)   |
     | |1|2|3|       |K|             |                               |
     +-+-+-+-+-------+-+-------------+ - - - - - - - - - - - - - - - +
     |     Extended payload length continued, if payload len == 127  |
     + - - - - - - - - - - - - - - - +-------------------------------+
     |                               |Masking-key, if MASK set to 1  |
     +-------------------------------+-------------------------------+
     | Masking-key (continued)       |          Payload Data         |
     +-------------------------------- - - - - - - - - - - - - - - - +
     :                     Payload Data continued ...                :
     + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
     |                     Payload Data continued ...                |
     +---------------------------------------------------------------+
    """

    def __init__(
        self,
        fin,                           # decimal integer 1 or 0
        opcode,                        # decimal integer 1 - 4
        mask_bit,                      # decimal integer 1 or 0
        payload_length_code,           # decimal integer 1 - 127
        decoded_payload,               # bytestring
        rsv1=0,                        # decimal integer 1 or 0
        rsv2=0,                        # decimal integer 1 or 0
        rsv3=0,                        # decimal integer 1 or 0
        payload=None,                  # bytestring
        masking_key=None,              # 32 bit byte string
        actual_payload_length=None,    # any decimal integer
        use_validation=True            # whether or not you care if this frame adheres to the spec
    ):
        """
        Store the frame components and, unless use_validation is False,
        run validate_frame() on them immediately.

        Raises WebSocketFrameValidationException if validation is enabled
        and one of the components is out of range or inconsistent.
        """
        self.fin = fin
        self.rsv1 = rsv1
        self.rsv2 = rsv2
        self.rsv3 = rsv3
        self.opcode = opcode
        self.mask_bit = mask_bit
        self.payload_length_code = payload_length_code
        self.masking_key = masking_key
        self.payload = payload
        self.decoded_payload = decoded_payload
        self.actual_payload_length = actual_payload_length
        self.use_validation = use_validation

        if self.use_validation:
            self.validate_frame()

    @classmethod
    def from_bytes(cls, bytestring):
        """
        Construct a websocket frame from an in-memory bytestring.

        To construct a frame from a stream of bytes, use from_byte_stream()
        directly. Returns the parsed WebSocketsFrame.
        """
        # this is a classmethod, so the parser must be reached through cls,
        # and the frame it builds has to be handed back to the caller
        return cls.from_byte_stream(io.BytesIO(bytestring).read)

    @classmethod
    def default_frame_from_message(cls, message, from_client=False):
        """
        Construct a basic websocket frame from some default values.

        Creates a non-fragmented text frame. When from_client is true the
        payload is masked with a freshly generated masking key, otherwise
        the message is used as the payload unchanged.
        """
        length_code, actual_length = get_payload_length_pair(message)

        if from_client:
            mask_bit = 1
            masking_key = random_masking_key()
            payload = apply_mask(message, masking_key)
        else:
            mask_bit = 0
            masking_key = None
            payload = message

        return cls(
            fin=1,       # final frame
            opcode=1,    # text
            mask_bit=mask_bit,
            payload_length_code=length_code,
            payload=payload,
            masking_key=masking_key,
            decoded_payload=message,
            actual_payload_length=actual_length
        )

    def validate_frame(self):
        """
        Validate websocket frame invariants, call at anytime to ensure the
        WebSocketsFrame has not been corrupted.

        Raises WebSocketFrameValidationException on the first invariant
        that does not hold.
        """
        # explicit raises instead of assert statements, so the checks are
        # still enforced when Python runs with -O
        def require(condition):
            if not condition:
                raise WebSocketFrameValidationException()

        require(0 <= self.fin <= 1)
        require(0 <= self.rsv1 <= 1)
        require(0 <= self.rsv2 <= 1)
        require(0 <= self.rsv3 <= 1)
        # NOTE(review): only opcodes 1-4 and length codes 1-127 pass, so
        # frames with opcode 0 or > 4, or with an empty payload, are
        # rejected -- confirm whether that restriction is intended.
        require(1 <= self.opcode <= 4)
        require(0 <= self.mask_bit <= 1)
        require(1 <= self.payload_length_code <= 127)

        if self.mask_bit == 1:
            require(1 <= len(self.masking_key) <= 4)
        else:
            require(self.masking_key is None)

        require(self.actual_payload_length == len(self.payload))

        if self.payload is not None and self.masking_key is not None:
            # unmasking the wire payload must give back the decoded payload
            require(apply_mask(self.payload, self.masking_key) == self.decoded_payload)

    def human_readable(self):
        """
        Return a multi-line string with one "name - value" line per frame
        attribute, for debugging.
        """
        attribute_names = (
            "fin",
            "rsv1",
            "rsv2",
            "rsv3",
            "opcode",
            "mask_bit",
            "payload_length_code",
            "masking_key",
            "payload",
            "decoded_payload",
            "actual_payload_length",
            "use_validation",
        )
        return "\n".join(
            [name + " - " + str(getattr(self, name)) for name in attribute_names]
        )

    def to_bytes(self):
        """
        Serialize the frame back into the wire format, returns a bytestring.

        Raises WebSocketFrameValidationException if validation is enabled
        and the frame is invalid.
        """
        # validate enforces all the assumptions made by this serializer
        # in the spirit of mitmproxy, it's possible to create and serialize invalid frames
        # by skipping validation.
        if self.use_validation:
            self.validate_frame()

        max_16_bit_int = (1 << 16)
        max_64_bit_int = (1 << 63)

        # break down of the bit-math used to construct the first byte from the frame's integer values
        # first shift the significant bit into the correct position
        # 00000001 << 7 = 10000000
        # ...
        # then combine:
        #
        # 10000000 fin
        # 01000000 rsv1
        # 00100000 rsv2
        # 00010000 rsv3
        # 00000001 opcode
        # -------- OR
        # 11110001 = first_byte
        first_byte = (
            (self.fin << 7) |
            (self.rsv1 << 6) |
            (self.rsv2 << 5) |
            (self.rsv3 << 4) |
            self.opcode
        )

        second_byte = (self.mask_bit << 7) | self.payload_length_code

        # '!BB' = pack as two unsigned bytes
        parts = [struct.pack('!BB', first_byte, second_byte)]

        if self.actual_payload_length < 126:
            # the length already fits in the 7 bit length code
            pass
        elif self.actual_payload_length < max_16_bit_int:
            # '!H' = pack as 16 bit unsigned short: 2 byte extended payload length
            parts.append(struct.pack('!H', self.actual_payload_length))
        elif self.actual_payload_length < max_64_bit_int:
            # '!Q' = pack as 64 bit unsigned long long: 8 byte extended payload length
            parts.append(struct.pack('!Q', self.actual_payload_length))
        # lengths of 2**63 and above get no extended length field here

        if self.masking_key is not None:
            parts.append(self.masking_key)

        parts.append(self.payload)    # already will be encoded if necessary

        return b''.join(parts)

    @classmethod
    def from_byte_stream(cls, read_bytes):
        """
        Read a websockets frame sent by a server or client.

        read_bytes is a function that takes a number of bytes and returns
        that many bytes; it can be backed by sockets or by any byte reader,
        so this function may be used to read frames from disk/wire/memory.

        Returns the parsed WebSocketsFrame.
        """
        first_byte = utils.bytes_to_int(read_bytes(1))
        second_byte = utils.bytes_to_int(read_bytes(1))

        fin = first_byte >> 7                 # grab the left most bit
        rsv1 = (first_byte >> 6) & 1          # the three reserved bits follow fin
        rsv2 = (first_byte >> 5) & 1
        rsv3 = (first_byte >> 4) & 1
        opcode = first_byte & 15              # grab right most 4 bits by and-ing with 00001111
        mask_bit = second_byte >> 7           # grab left most bit
        payload_length = second_byte & 127    # grab the next 7 bits

        # payload_length > 125 indicates you need to read more bytes
        # to get the actual payload length
        if payload_length <= 125:
            actual_payload_length = payload_length
        elif payload_length == 126:
            actual_payload_length = utils.bytes_to_int(read_bytes(2))
        else:
            # payload_length == 127
            actual_payload_length = utils.bytes_to_int(read_bytes(8))

        # masking key only present if mask bit set
        if mask_bit == 1:
            masking_key = read_bytes(4)
        else:
            masking_key = None

        payload = read_bytes(actual_payload_length)

        if mask_bit == 1:
            decoded_payload = apply_mask(payload, masking_key)
        else:
            decoded_payload = payload

        return cls(
            fin=fin,
            opcode=opcode,
            mask_bit=mask_bit,
            payload_length_code=payload_length,
            payload=payload,
            masking_key=masking_key,
            decoded_payload=decoded_payload,
            rsv1=rsv1,
            rsv2=rsv2,
            rsv3=rsv3,
            actual_payload_length=actual_payload_length
        )
|
||
|
|
||
|
def apply_mask(message, masking_key):
    """
    Data sent from the client must be masked to prevent malicious clients
    from sending data over the wire in predictable patterns.

    This method both encodes and decodes strings with the provided mask:
    every byte of message is XOR-ed with the masking key byte at position
    (index mod 4), so applying the same key twice gives back the input.

    Servers do not have to mask data they send to the client.
    https://tools.ietf.org/html/rfc6455#section-5.3

    message is a bytestring and masking_key a 4 byte bytestring.
    Returns the masked (or unmasked) bytestring.
    """
    if not isinstance(message, bytes):
        # text input is treated as Latin-1 so that code points map 1:1 to
        # byte values, like a per-character ord() would
        message = message.encode('latin-1')

    key = bytearray(masking_key)
    # one pass over the data instead of growing a string char by char
    masked = bytearray(
        value ^ key[index % 4] for index, value in enumerate(bytearray(message))
    )
    return bytes(masked)
|
||
|
|
||
|
def random_masking_key():
    """
    Generate a new masking key: 4 bytes taken from os.urandom
    """
    key_length = 4
    return os.urandom(key_length)
|
||
|
|
||
|
def masking_key_list(masking_key):
    """
    Convert each element of masking_key with utils.bytes_to_int and
    return the results as a list, in order
    """
    converted = []
    for byte in masking_key:
        converted.append(utils.bytes_to_int(byte))
    return converted
|
||
|
|
||
|
def create_client_handshake(host, port, key, version, resource):
    """
    WebSockets connections are initiated by the client with a valid HTTP upgrade request.

    Builds that request: a GET for resource followed by the Host, Connection,
    Upgrade, Sec-WebSocket-Key and Sec-WebSocket-Version headers, assembled
    by build_handshake().
    """
    request_line = "GET %s HTTP/1.1" % resource
    host_header = '%s:%s' % (host, port)
    upgrade_headers = [
        ('Host', host_header),
        ('Connection', 'Upgrade'),
        ('Upgrade', 'websocket'),
        ('Sec-WebSocket-Key', key),
        ('Sec-WebSocket-Version', version),
    ]
    return build_handshake(upgrade_headers, request_line)
|
||
|
|
||
|
|
||
|
def create_server_handshake(key, magic = websockets_magic):
    """
    The server response is a valid HTTP 101 response.

    key is the Sec-WebSocket-Key value sent by the client. The
    Sec-WebSocket-Accept header is the base64 encoding of the SHA-1 digest
    of key + magic. Returns the response as assembled by build_handshake().
    """
    # digest() gives the raw hash bytes directly, no hex round trip needed
    digest = b64encode(sha1(key + magic).digest())
    headers = [
        ('Connection', 'Upgrade'),
        ('Upgrade', 'websocket'),
        ('Sec-WebSocket-Accept', digest)
    ]
    request = "HTTP/1.1 101 Switching Protocols"
    return build_handshake(headers, request)
|
||
|
|
||
|
|
||
|
def build_handshake(headers, request):
    """
    Assemble an HTTP message from a start line and (name, value) header pairs.

    Every line is utf-8 encoded and the lines are joined with CRLF; a final
    CRLF element terminates the header section. Returns a bytestring.
    """
    crlf = b'\r\n'
    lines = [request.encode('utf-8')]
    lines.extend(
        ("%s: %s" % (name, content)).encode('utf-8') for name, content in headers
    )
    lines.append(crlf)
    return crlf.join(lines)
|
||
|
|
||
|
|
||
|
def read_handshake(read_bytes, num_bytes_per_read):
    """
    Using the provided function that reads bytes, read in a complete
    HTTP message, which terminates with a double CRLF.

    Reads num_bytes_per_read bytes at a time and stops as soon as the data
    read so far contains the terminator, or when a read returns nothing.
    Returns everything that was read, including any bytes that came after
    the terminator in the last chunk.
    """
    terminator = b'\r\n\r\n'
    received = b''
    chunk = read_bytes(num_bytes_per_read)
    while chunk:
        received += chunk
        if terminator in received:
            break
        chunk = read_bytes(num_bytes_per_read)
    return received
|
||
|
|
||
|
def get_payload_length_pair(payload_bytestring):
    """
    A websockets frame contains an initial length_code, and an optional
    extended length to represent the actual length if the payload is
    longer than 125 bytes.

    Returns (length_code, actual_length): the code is the length itself up
    to 125, 126 for lengths up to 65535 and 127 for anything longer.
    """
    size = len(payload_bytestring)

    if size > 65535:
        code = 127
    elif size > 125:
        code = 126
    else:
        code = size
    return (code, size)
|
||
|
|
||
|
def server_process_handshake(handshake):
|
||
|
headers = Message(StringIO(handshake.split('\r\n', 1)[1]))
|
||
|
if headers.get("Upgrade", None) != "websocket":
|
||
|
return
|
||
|
key = headers['Sec-WebSocket-Key']
|
||
|
return key
|
||
|
|
||
|
def generate_client_nounce():
    """
    Generate a client nonce: 16 bytes from os.urandom, base64 encoded and
    decoded to text as utf-8
    """
    raw_nonce = os.urandom(16)
    encoded_nonce = b64encode(raw_nonce)
    return encoded_nonce.decode('utf-8')
|
||
|
|