#!/usr/bin/env python3 import base64 import copy import datetime import json import math import re import socket import shlex import threading from collections import namedtuple from urllib.parse import urlparse, ParseResult, parse_qs, urlencode from subprocess import Popen, PIPE, TimeoutExpired from http import cookies as hcookies class MessageError(Exception): pass class ProxyException(Exception): pass class InvalidQuery(Exception): pass class SocketClosed(Exception): pass class SockBuffer: # I can't believe I have to implement this def __init__(self, sock): self.buf = [] # a list of chunks of strings self.s = sock self.closed = False def close(self): self.s.shutdown(socket.SHUT_RDWR) self.s.close() self.closed = True def _check_newline(self): for chunk in self.buf: if '\n' in chunk: return True return False def readline(self): # Receive until we get a newline, raise SocketClosed if socket is closed while True: try: data = self.s.recv(8192) except OSError: raise SocketClosed() if not data: raise SocketClosed() self.buf.append(data) if b'\n' in data: break # Combine chunks retbytes = bytes() n = 0 for chunk in self.buf: n += 1 if b'\n' in chunk: head, tail = chunk.split(b'\n', 1) retbytes += head self.buf = self.buf[n:] self.buf = [tail] + self.buf break else: retbytes += chunk return retbytes.decode() def send(self, data): try: self.s.send(data) except OSError: raise SocketClosed() class Headers: def __init__(self, headers=None): self.headers = {} if headers is not None: if isinstance(headers, Headers): for _, pairs in headers.headers.items(): for k, v in pairs: self.add(k, v) else: for k, vs in headers.items(): for v in vs: self.add(k, v) def __contains__(self, hd): for k, _ in self.headers.items(): if k.lower() == hd.lower(): return True return False def add(self, k, v): try: l = self.headers[k.lower()] l.append((k,v)) except KeyError: self.headers[k.lower()] = [(k,v)] def set(self, k, v): self.headers[k.lower()] = [(k,v)] def get(self, k): return self.headers[k.lower()][0][1] def delete(self, k): try: del self.headers[k.lower()] except KeyError: pass def pairs(self, key=None): for _, kvs in self.headers.items(): for k, v in kvs: if key is None or k.lower() == key.lower(): yield (k, v) def dict(self): retdict = {} for _, kvs in self.headers.items(): for k, v in kvs: if k in retdict: retdict[k].append(v) else: retdict[k] = [v] return retdict class RequestContext: def __init__(self, client, query=None): self._current_query = [] self.client = client if query is not None: self._current_query = query def _validate(self, query): self.client.validate_query(query) def set_query(self, query): self._validate(query) self._current_query = query def apply_phrase(self, phrase): self._validate([phrase]) self._current_query.append(phrase) def pop_phrase(self): if len(self._current_query) > 0: self._current_query.pop() def apply_filter(self, filt): self._validate([[filt]]) self._current_query.append([filt]) @property def query(self): return copy.deepcopy(self._current_query) class URL: def __init__(self, url): parsed = urlparse(url) if url is not None: parsed = urlparse(url) self.scheme = parsed.scheme self.netloc = parsed.netloc self.path = parsed.path self.params = parsed.params self.query = parsed.query self.fragment = parsed.fragment else: self.scheme = "" self.netloc = "" self.path = "/" self.params = "" self.query = "" self.fragment = "" def geturl(self, include_params=True): params = self.params query = self.query fragment = self.fragment if not include_params: params = "" query = "" fragment = "" r = ParseResult(scheme=self.scheme, netloc=self.netloc, path=self.path, params=params, query=query, fragment=fragment) return r.geturl() def parameters(self): try: return parse_qs(self.query, keep_blank_values=True) except Exception: return [] def param_iter(self): for k, vs in self.parameters().items(): for v in vs: yield k, v def set_param(self, key, val): params = self.parameters() params[key] = [val] self.query = urlencode(params) def add_param(self, key, val): params = self.parameters() if key in params: params[key].append(val) else: params[key] = [val] self.query = urlencode(params) def del_param(self, key): params = self.parameters() del params[key] self.query = urlencode(params) def set_params(self, params): self.query = urlencode(params) class InterceptMacro: """ A class representing a macro that modifies requests as they pass through the proxy """ def __init__(self): self.name = '' self.intercept_requests = False self.intercept_responses = False self.intercept_ws = False def __repr__(self): return "" % self.name def mangle_request(self, request): return request def mangle_response(self, request, response): return response def mangle_websocket(self, request, response, message): return message class HTTPRequest: def __init__(self, method="GET", path="/", proto_major=1, proto_minor=1, headers=None, body=bytes(), dest_host="", dest_port=80, use_tls=False, time_start=None, time_end=None, db_id="", tags=None, headers_only=False, storage_id=0): # http info self.method = method self.url = URL(path) self.proto_major = proto_major self.proto_minor = proto_minor self.headers = Headers(headers) self.headers_only = headers_only self._body = bytes() if not headers_only: self.body = body # metadata self.dest_host = dest_host self.dest_port = dest_port self.use_tls = use_tls self.time_start = time_start self.time_end = time_end self.response = None self.unmangled = None self.ws_messages = [] self.db_id = db_id self.storage_id = storage_id if tags is not None: self.tags = set(tags) else: self.tags = set() @property def body(self): return self._body @body.setter def body(self, bs): self.headers_only = False if type(bs) is str: self._body = bs.encode() elif type(bs) is bytes: self._body = bs else: raise Exception("invalid body type: {}".format(type(bs))) self.headers.set("Content-Length", str(len(self._body))) @property def content_length(self): if 'content-length' in self.headers: return int(self.headers.get('content-length')) return len(self.body) def status_line(self): sline = "{method} {path} HTTP/{proto_major}.{proto_minor}".format( method=self.method, path=self.url.geturl(), proto_major=self.proto_major, proto_minor=self.proto_minor).encode() return sline def headers_section(self): message = self.status_line() + b"\r\n" for k, v in self.headers.pairs(): message += "{}: {}\r\n".format(k, v).encode() return message def full_message(self): message = self.headers_section() message += b"\r\n" message += self.body return message def parameters(self): try: return parse_qs(self.body.decode(), keep_blank_values=True) except Exception: return [] def param_iter(self, ignore_content_type=False): if not ignore_content_type: if "content-type" not in self.headers: return if "www-form-urlencoded" not in self.headers.get("content-type").lower(): return for k, vs in self.parameters().items(): for v in vs: yield k, v def set_param(self, key, val): params = self.parameters() params[key] = [val] self.body = urlencode(params) def add_param(self, key, val): params = self.parameters() if key in params: params[key].append(val) else: params[key] = [val] self.body = urlencode(params) def del_param(self, key): params = self.parameters() del params[key] self.body = urlencode(params) def set_params(self, params): self.body = urlencode(params) def cookies(self): try: cookie = hcookies.BaseCookie() cookie.load(self.headers.get("cookie")) return cookie except Exception as e: return hcookies.BaseCookie() def cookie_iter(self): c = self.cookies() for k in c: yield k, c[k].value def set_cookie(self, key, val): c = self.cookies() c[key] = val self.set_cookies(c) def del_cookie(self, key): c = self.cookies() del c[key] self.set_cookies(c) def set_cookies(self, c): if isinstance(c, hcookies.BaseCookie): # it's a basecookie cookie_pairs = [] for k in c: cookie_pairs.append('{}={}'.format(k, c[k].value)) header_str = '; '.join(cookie_pairs) elif isinstance(c, HTTPRequest): # it's a request we should copy cookies from try: header_str = c.headers.get("Cookie") except KeyError: header_str = "" else: # it's a dictionary cookie_pairs = [] for k, v in c.items(): cookie_pairs.append('{}={}'.format(k, v)) header_str = '; '.join(cookie_pairs) if header_str == '': try: self.headers.delete("Cookie") except KeyError: pass else: self.headers.set("Cookie", header_str) def add_cookies(self, c): new_cookies = self.cookies() if isinstance(c, hcookies.BaseCookie): for k in c: new_cookies[k] = c[k].value elif isinstance(c, HTTPRequest): for k, v in c.cookie_iter(): new_cookies[k] = v elif isinstance(c, HTTPResponse): for k, v in c.cookie_iter(): new_cookies[k] = v else: for k, v in c.items(): new_cookies[k] = v self.set_cookies(new_cookies) def copy(self): return HTTPRequest( method=self.method, path=self.url.geturl(), proto_major=self.proto_major, proto_minor=self.proto_minor, headers=self.headers, body=self.body, dest_host=self.dest_host, dest_port=self.dest_port, use_tls=self.use_tls, tags=copy.deepcopy(self.tags), headers_only=self.headers_only, ) class HTTPResponse: def __init__(self, status_code=200, reason="OK", proto_major=1, proto_minor=1, headers=None, body=bytes(), db_id="", headers_only=False, storage_id=0): self.status_code = status_code self.reason = reason self.proto_major = proto_major self.proto_minor = proto_minor self.headers = Headers() if headers is not None: for k, vs in headers.items(): for v in vs: self.headers.add(k, v) self.headers_only = headers_only self._body = bytes() if not headers_only: self.body = body self.unmangled = None self.db_id = db_id self.storage = storage_id @property def body(self): return self._body @body.setter def body(self, bs): self.headers_only = False if type(bs) is str: self._body = bs.encode() elif type(bs) is bytes: self._body = bs else: raise Exception("invalid body type: {}".format(type(bs))) self.headers.set("Content-Length", str(len(self._body))) @property def content_length(self): if 'content-length' in self.headers: return int(self.headers.get('content-length')) return len(self.body) def status_line(self): sline = "HTTP/{proto_major}.{proto_minor} {status_code} {reason}".format( proto_major=self.proto_major, proto_minor=self.proto_minor, status_code=self.status_code, reason=self.reason).encode() return sline def headers_section(self): message = self.status_line() + b"\r\n" for k, v in self.headers.pairs(): message += "{}: {}\r\n".format(k, v).encode() return message def full_message(self): message = self.headers_section() message += b"\r\n" message += self.body return message def cookies(self): try: cookie = hcookies.BaseCookie() for _, v in self.headers.pairs('set-cookie'): cookie.load(v) return cookie except Exception as e: return hcookies.BaseCookie() def cookie_iter(self): c = self.cookies() for k in c: yield k, c[k].value def set_cookie(self, key, val): c = self.cookies() c[key] = val self.set_cookies(c) def del_cookie(self, key): c = self.cookies() del c[key] self.set_cookies(c) def set_cookies(self, c): self.headers.delete("set-cookie") if isinstance(c, hcookies.BaseCookie): cookies = c else: cookies = hcookies.BaseCookie() for k, v in c.items(): cookies[k] = v for _, m in c.items(): self.headers.add("Set-Cookie", m.OutputString()) def copy(self): return HTTPResponse( status_code=self.status_code, reason=self.reason, proto_major=self.proto_major, proto_minor=self.proto_minor, headers=self.headers.headers, body=self.body, headers_only=self.headers_only, ) class WSMessage: def __init__(self, is_binary=True, message=bytes(), to_server=True, timestamp=None, db_id="", storage_id=0): self.is_binary = is_binary self.message = message self.to_server = to_server self.timestamp = timestamp or datetime.datetime(1970, 1, 1) self.unmangled = None self.db_id = db_id self.storage = storage_id def copy(self): return WSMessage( is_binary=self.is_binary, message=self.message, to_server=self.to_server, ) ScopeResult = namedtuple("ScopeResult", ["is_custom", "filter"]) ListenerResult = namedtuple("ListenerResult", ["lid", "addr"]) GenPemCertsResult = namedtuple("GenPemCertsResult", ["key_pem", "cert_pem"]) SavedQuery = namedtuple("SavedQuery", ["name", "query"]) SavedStorage = namedtuple("SavedStorage", ["storage_id", "description"]) def messagingFunction(func): def f(self, *args, **kwargs): if self.is_interactive: raise MessageError("cannot be called while other message is interactive") if self.closed: raise MessageError("connection is closed") return func(self, *args, **kwargs) return f class ProxyConnection: next_id = 1 def __init__(self, kind="", addr=""): self.connid = ProxyConnection.next_id ProxyConnection.next_id += 1 self.sbuf = None self.buf = bytes() self.parent_client = None self.debug = False self.is_interactive = False self.closed = True self.sock_lock_read = threading.Lock() self.sock_lock_write = threading.Lock() self.kind = None self.addr = None if kind.lower() == "tcp": tcpaddr, port = addr.rsplit(":", 1) self.connect_tcp(tcpaddr, int(port)) elif kind.lower() == "unix": self.connect_unix(addr) def __enter__(self): return self def __exit__(self, exc_type, exc_value, traceback): self.close() def connect_tcp(self, addr, port): s = socket.socket(socket.AF_INET, socket.SOCK_STREAM) s.connect((addr, port)) self.sbuf = SockBuffer(s) self.closed = False self.kind = "tcp" self.addr = "{}:{}".format(addr, port) def connect_unix(self, addr): s = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM) s.connect(addr) self.sbuf = SockBuffer(s) self.closed = False self.kind = "unix" self.addr = addr @property def maddr(self): if self.kind is not None: return "{}:{}".format(self.kind, self.addr) else: return None def close(self): self.sbuf.close() if self.parent_client is not None: self.parent_client.conns.remove(self) self.closed = True def read_message(self): with self.sock_lock_read: l = self.sbuf.readline() if self.debug: print("<({}) {}".format(self.connid, l)) j = json.loads(l) if "Success" in j and j["Success"] == False: if "Reason" in j: raise MessageError(j["Reason"]) raise MessageError("unknown error") return j def submit_command(self, cmd): with self.sock_lock_write: ln = json.dumps(cmd).encode()+b"\n" if self.debug: print(">({}) {} ".format(self.connid, ln.decode())) self.sbuf.send(ln) def reqrsp_cmd(self, cmd): self.submit_command(cmd) ret = self.read_message() if ret is None: raise Exception() return ret ########### ## Commands @messagingFunction def ping(self): cmd = {"Command": "Ping"} result = self.reqrsp_cmd(cmd) return result["Ping"] @messagingFunction def submit(self, req, storage=0): cmd = { "Command": "Submit", "Request": encode_req(req), "Storage": 0, } if storage is not None: cmd["Storage"] = storage result = self.reqrsp_cmd(cmd) if "SubmittedRequest" not in result: raise MessageError("no request returned") newreq = decode_req(result["SubmittedRequest"], storage=storage) req.response = newreq.response req.unmangled = newreq.unmangled req.db_id = newreq.db_id req.storage_id = storage @messagingFunction def save_new(self, req, storage): reqd = encode_req(req) cmd = { "Command": "SaveNew", "Request": encode_req(req), "Storage": storage, } result = self.reqrsp_cmd(cmd) req.db_id = result["DbId"] req.storage_id = storage return result["DbId"] def _query_storage(self, q, storage, headers_only=False, max_results=0): cmd = { "Command": "StorageQuery", "Query": q, "HeadersOnly": headers_only, "MaxResults": max_results, "Storage": storage, } result = self.reqrsp_cmd(cmd) reqs = [] unmangled = set() for reqd in result["Results"]: req = decode_req(reqd, headers_only=headers_only, storage=storage) req.storage_id = storage reqs.append(req) if req.unmangled is not None: unmangled.add(req.unmangled.db_id) return [r for r in reqs if r.db_id not in unmangled] @messagingFunction def query_storage(self, q, storage, max_results=0, headers_only=False): return self._query_storage(q, storage, headers_only=headers_only, max_results=max_results) @messagingFunction def req_by_id(self, reqid, storage, headers_only=False): results = self._query_storage([[["dbid", "is", reqid]]], storage, headers_only=headers_only, max_results=1) if len(results) == 0: raise MessageError("request with id {} does not exist".format(reqid)) return results[0] @messagingFunction def set_scope(self, filt): cmd = { "Command": "SetScope", "Query": filt, } self.reqrsp_cmd(cmd) @messagingFunction def get_scope(self): cmd = { "Command": "ViewScope", } result = self.reqrsp_cmd(cmd) ret = ScopeResult(result["IsCustom"], result["Query"]) return ret @messagingFunction def add_tag(self, reqid, tag, storage): cmd = { "Command": "AddTag", "ReqId": reqid, "Tag": tag, "Storage": storage, } self.reqrsp_cmd(cmd) @messagingFunction def remove_tag(self, reqid, tag, storage): cmd = { "Command": "RemoveTag", "ReqId": reqid, "Tag": tag, "Storage": storage, } self.reqrsp_cmd(cmd) @messagingFunction def clear_tag(self, reqid, storage): cmd = { "Command": "ClearTag", "ReqId": reqid, "Storage": storage, } self.reqrsp_cmd(cmd) @messagingFunction def all_saved_queries(self, storage): cmd = { "Command": "AllSavedQueries", "Storage": storage, } results = self.reqrsp_cmd(cmd) queries = [] for result in results["Queries"]: queries.append(SavedQuery(name=result["Name"], query=result["Query"])) return queries @messagingFunction def save_query(self, name, filt, storage): cmd = { "Command": "SaveQuery", "Name": name, "Query": filt, "Storage": storage, } self.reqrsp_cmd(cmd) @messagingFunction def load_query(self, name, storage): cmd = { "Command": "LoadQuery", "Name": name, "Storage": storage, } result = self.reqrsp_cmd(cmd) return result["Query"] @messagingFunction def delete_query(self, name, storage): cmd = { "Command": "DeleteQuery", "Name": name, "Storage": storage, } self.reqrsp_cmd(cmd) @messagingFunction def add_listener(self, addr, port, transparent=False, destHost="", destPort=0, destUseTLS=False): laddr = "{}:{}".format(addr, port) cmd = { "Command": "AddListener", "Type": "tcp", "Addr": laddr, "TransparentMode": transparent, "DestHost": destHost, "DestPort": destPort, "DestUseTLS": destUseTLS, } result = self.reqrsp_cmd(cmd) lid = result["Id"] return lid @messagingFunction def remove_listener(self, lid): cmd = { "Command": "RemoveListener", "Id": lid, } self.reqrsp_cmd(cmd) @messagingFunction def get_listeners(self): cmd = { "Command": "GetListeners", } result = self.reqrsp_cmd(cmd) results = [] for r in result["Results"]: results.append(r["Id"], r["Addr"]) return results @messagingFunction def load_certificates(self, cert_file, pkey_file): cmd = { "Command": "LoadCerts", "KeyFile": pkey_file, "CertificateFile": cert_file, } self.reqrsp_cmd(cmd) @messagingFunction def set_certificates(self, pkey_pem, cert_pem): cmd = { "Command": "SetCerts", "KeyPEMData": pkey_pem, "CertificatePEMData": cert_pem, } self.reqrsp_cmd(cmd) @messagingFunction def clear_certificates(self): cmd = { "Command": "ClearCerts", } self.reqrsp_cmd(cmd) @messagingFunction def generate_certificates(self, pkey_file, cert_file): cmd = { "Command": "GenCerts", "KeyFile": pkey_file, "CertFile": cert_file, } self.reqrsp_cmd(cmd) @messagingFunction def generate_pem_certificates(self): cmd = { "Command": "GenPEMCerts", } result = self.reqrsp_cmd(cmd) ret = GenPemCertsResult(result["KeyPEMData"], result["CertificatePEMData"]) return ret @messagingFunction def validate_query(self, query): cmd = { "Command": "ValidateQuery", "Query": query, } try: result = self.reqrsp_cmd(cmd) except MessageError as e: raise InvalidQuery(str(e)) @messagingFunction def check_request(self, query, req): cmd = { "Command": "checkrequest", "Query": query, "Request": encode_req(req), } result = self.reqrsp_cmd(cmd) return result["Result"] @messagingFunction def add_sqlite_storage(self, path, desc): cmd = { "Command": "AddSQLiteStorage", "Path": path, "Description": desc } result = self.reqrsp_cmd(cmd) return result["StorageId"] @messagingFunction def add_in_memory_storage(self, desc): cmd = { "Command": "AddInMemoryStorage", "Description": desc } result = self.reqrsp_cmd(cmd) return result["StorageId"] @messagingFunction def close_storage(self, strage_id): cmd = { "Command": "CloseStorage", "StorageId": storage_id, } result = self.reqrsp_cmd(cmd) @messagingFunction def set_proxy_storage(self, storage_id): cmd = { "Command": "SetProxyStorage", "StorageId": storage_id, } result = self.reqrsp_cmd(cmd) @messagingFunction def list_storage(self): cmd = { "Command": "ListStorage", } result = self.reqrsp_cmd(cmd) ret = [] for ss in result["Storages"]: ret.append(SavedStorage(ss["Id"], ss["Description"])) return ret @messagingFunction def set_proxy(self, use_proxy=False, proxy_host="", proxy_port=0, use_creds=False, username="", password="", is_socks=False): cmd = { "Command": "SetProxy", "UseProxy": use_proxy, "ProxyHost": proxy_host, "ProxyPort": proxy_port, "ProxyIsSOCKS": is_socks, "UseCredentials": use_creds, "Username": username, "Password": password, } self.reqrsp_cmd(cmd) @messagingFunction def intercept(self, macro): # Run an intercepting macro until closed from .util import log_error # Start intercepting self.is_interactive = True cmd = { "Command": "Intercept", "InterceptRequests": macro.intercept_requests, "InterceptResponses": macro.intercept_responses, "InterceptWS": macro.intercept_ws, } try: self.reqrsp_cmd(cmd) except Exception as e: self.is_interactive = False raise e def run_macro(): while True: try: msg = self.read_message() except MessageError as e: log_error(str(e)) return except SocketClosed: return def mangle_and_respond(msg): retCmd = None if msg["Type"] == "httprequest": req = decode_req(msg["Request"]) newReq = macro.mangle_request(req) if newReq is None: retCmd = { "Id": msg["Id"], "Dropped": True, } else: newReq.unmangled = None newReq.response = None newReq.ws_messages = [] retCmd = { "Id": msg["Id"], "Dropped": False, "Request": encode_req(newReq), } elif msg["Type"] == "httpresponse": req = decode_req(msg["Request"]) rsp = decode_rsp(msg["Response"]) newRsp = macro.mangle_response(req, rsp) if newRsp is None: retCmd = { "Id": msg["Id"], "Dropped": True, } else: newRsp.unmangled = None retCmd = { "Id": msg["Id"], "Dropped": False, "Response": encode_rsp(newRsp), } elif msg["Type"] == "wstoserver" or msg["Type"] == "wstoclient": req = decode_req(msg["Request"]) rsp = decode_rsp(msg["Response"]) wsm = decode_ws(msg["WSMessage"]) newWsm = macro.mangle_websocket(req, rsp, wsm) if newWsm is None: retCmd = { "Id": msg["Id"], "Dropped": True, } else: newWsm.unmangled = None retCmd = { "Id": msg["Id"], "Dropped": False, "WSMessage": encode_ws(newWsm), } else: raise Exception("Unknown message type: " + msg["Type"]) if retCmd is not None: try: self.submit_command(retCmd) except SocketClosed: return mangle_thread = threading.Thread(target=mangle_and_respond, args=(msg,)) mangle_thread.start() self.int_thread = threading.Thread(target=run_macro) self.int_thread.start() ActiveStorage = namedtuple("ActiveStorage", ["type", "storage_id", "prefix"]) def _serialize_storage(stype, prefix): return "{}|{}".format(stype, prefix) class ProxyClient: def __init__(self, binary=None, debug=False, conn_addr=None): self.binloc = binary self.proxy_proc = None self.ltype = None self.laddr = None self.debug = debug self.conn_addr = conn_addr self.conns = set() self.msg_conn = None # conn for single req/rsp messages self.context = RequestContext(self) self.storage_by_id = {} self.storage_by_prefix = {} self.proxy_storage = None self.inmem_storage = None self.reqrsp_methods = { "submit_command", #"reqrsp_cmd", "ping", #"submit", #"save_new", #"query_storage", #"req_by_id", "set_scope", "get_scope", # "add_tag", # "remove_tag", # "clear_tag", "all_saved_queries", "save_query", "load_query", "delete_query", "add_listener", "remove_listener", "get_listeners", "load_certificates", "set_certificates", "clear_certificates", "generate_certificates", "generate_pem_certificates", "validate_query", "check_request", "list_storage", # "add_sqlite_storage", # "add_in_memory_storage", # "close_storage", # "set_proxy_storage", "set_proxy" } def __enter__(self): if self.conn_addr is not None: self.msg_connect(self.conn_addr) else: self.execute_binary(binary=self.binloc, debug=self.debug) return self def __exit__(self, exc_type, exc_value, traceback): self.close() def __getattr__(self, name): if name in self.reqrsp_methods: return getattr(self.msg_conn, name) raise NotImplementedError(name) @property def maddr(self): if self.ltype is not None: return "{}:{}".format(self.ltype, self.laddr) else: return None def execute_binary(self, binary=None, debug=False, listen_addr=None): self.binloc = binary args = [self.binloc] if listen_addr is not None: args += ["--msglisten", listen_addr] else: args += ["--msgauto"] if debug: args += ["--dbg"] self.proxy_proc = Popen(args, stdout=PIPE, stderr=PIPE) # Wait for it to start and make connection listenstr = self.proxy_proc.stdout.readline().rstrip() self.msg_connect(listenstr.decode()) def msg_connect(self, addr): self.ltype, self.laddr = addr.split(":", 1) self.msg_conn = self.new_conn() self._get_storage() def close(self): conns = list(self.conns) for conn in conns: conn.close() if self.proxy_proc is not None: self.proxy_proc.terminate() def new_conn(self): conn = ProxyConnection(kind=self.ltype, addr=self.laddr) conn.parent_client = self conn.debug = self.debug self.conns.add(conn) return conn # functions involving storage def _add_storage(self, storage, prefix): self.storage_by_prefix[prefix] = storage self.storage_by_id[storage.storage_id] = storage def _clear_storage(self): self.storage_by_prefix = {} self.storage_by_id = {} def _get_storage(self): self._clear_storage() storages = self.list_storage() for s in storages: stype, prefix = s.description.split("|") storage = ActiveStorage(stype, s.storage_id, prefix) self._add_storage(storage, prefix) def parse_reqid(self, reqid): if reqid[0].isalpha(): prefix = reqid[0] realid = reqid[1:] else: prefix = "" realid = reqid # `u`, `s` are special cases for the unmangled version of req and rsp if prefix == 'u': req = self.req_by_id(realid) if req.unmangled is None: raise MessageError("request %s was not mangled" % reqid) ureq = req.unmangled return self.storage_by_id[ureq.storage_id], ureq.db_id elif prefix == 's': req = self.req_by_id(realid) if req.response is None: raise MessageError("response %s was not mangled" % reqid) if req.response.unmangled is None: raise MessageError("response %s was not mangled" % reqid) return self.storage_by_id[req.storage_id], req.db_id else: storage = self.storage_by_prefix[prefix] return storage, realid def storage_iter(self): for _, s in self.storage_by_id.items(): yield s def _stg_or_def(self, storage): if storage is None: return self.proxy_storage return storage def is_in_context(self, req): return self.check_request(self.context.query, req) def in_context_requests(self, headers_only=False, max_results=0): results = self.query_storage(self.context.query, headers_only=headers_only, max_results=max_results) ret = results if max_results > 0 and len(results) > max_results: ret = results[:max_results] return ret def in_context_requests_iter(self, headers_only=False, max_results=0): results = self.query_storage(self.context.query, headers_only=headers_only, max_results=max_results) ret = results if max_results > 0 and len(results) > max_results: ret = results[:max_results] for reqh in ret: req = self.req_by_id(reqh.db_id, storage_id=reqh.storage_id) yield req def get_reqid(self, req): prefix = "" if req.storage_id in self.storage_by_id: s = self.storage_by_id[req.storage_id] prefix = s.prefix return "{}{}".format(prefix, req.db_id) # functions that don't just pass through to underlying conn def add_sqlite_storage(self, path, prefix): desc = _serialize_storage("sqlite", prefix) sid = self.msg_conn.add_sqlite_storage(path, desc) s = ActiveStorage(type="sqlite", storage_id=sid, prefix=prefix) self._add_storage(s, prefix) return s def add_in_memory_storage(self, prefix): desc = _serialize_storage("inmem", prefix) sid = self.msg_conn.add_in_memory_storage(desc) s = ActiveStorage(type="inmem", storage_id=sid, prefix=prefix) self._add_storage(s, prefix) return s def close_storage(self, storage_id): s = self.storage_by_id[storage_id] self.msg_conn.close_storage(s.storage_id) del self.storage_by_id[s.storage_id] del self.storage_by_prefix[s.storage_prefix] def set_proxy_storage(self, storage_id): s = self.storage_by_id[storage_id] self.msg_conn.set_proxy_storage(s.storage_id) self.proxy_storage = storage_id def save_new(self, req, inmem=False, storage=None): if inmem: storage = self.inmem_storage else: storage = self._stg_or_def(storage) self.msg_conn.save_new(req, storage=storage) def submit(self, req, save=False, inmem=False, storage=None): if save: storage = self._stg_or_def(storage) if inmem: storage = self.inmem_storage self.msg_conn.submit(req, storage=storage) def query_storage(self, q, max_results=0, headers_only=False, storage=None): results = [] if storage is None: for s in self.storage_iter(): results += self.msg_conn.query_storage(q, max_results=max_results, headers_only=headers_only, storage=s.storage_id) else: results += self.msg_conn.query_storage(q, max_results=max_results, headers_only=headers_only, storage=storage) def kfunc(req): if req.time_start is None: return datetime.datetime.utcfromtimestamp(0) return req.time_start results.sort(key=kfunc) results = [r for r in reversed(results)] return results def req_by_id(self, reqid, storage_id=None, headers_only=False): if storage_id is None: storage, db_id = self.parse_reqid(reqid) storage_id = storage.storage_id else: db_id = reqid retreq = self.msg_conn.req_by_id(db_id, headers_only=headers_only, storage=storage_id) if reqid[0] == 's': # `u` is handled by parse_reqid retreq.response = retreq.response.unmangled return retreq # for these and submit, might need storage stored on the request itself def add_tag(self, reqid, tag, storage=None): self.msg_conn.add_tag(reqid, tag, storage=self._stg_or_def(storage)) def remove_tag(self, reqid, tag, storage=None): self.msg_conn.remove_tag(reqid, tag, storage=self._stg_or_def(storage)) def clear_tag(self, reqid, storage=None): self.msg_conn.clear_tag(reqid, storage=self._stg_or_def(storage)) def all_saved_queries(self, storage=None): self.msg_conn.all_saved_queries(storage=None) def save_query(self, name, filt, storage=None): self.msg_conn.save_query(name, filt, storage=self._stg_or_def(storage)) def load_query(self, name, storage=None): self.msg_conn.load_query(name, storage=self._stg_or_def(storage)) def delete_query(self, name, storage=None): self.msg_conn.delete_query(name, storage=self._stg_or_def(storage)) def decode_req(result, headers_only=False, storage=0): if "StartTime" in result and result["StartTime"] > 0: time_start = time_from_nsecs(result["StartTime"]) else: time_start = None if "EndTime" in result and result["EndTime"] > 0: time_end = time_from_nsecs(result["EndTime"]) else: time_end = None if "DbId" in result: db_id = result["DbId"] else: db_id = "" if "Tags" in result: tags = result["Tags"] else: tags = "" ret = HTTPRequest( method=result["Method"], path=result["Path"], proto_major=result["ProtoMajor"], proto_minor=result["ProtoMinor"], headers=copy.deepcopy(result["Headers"]), body=base64.b64decode(result["Body"]), dest_host=result["DestHost"], dest_port=result["DestPort"], use_tls=result["UseTLS"], time_start=time_start, time_end=time_end, tags=tags, headers_only=headers_only, db_id=db_id, storage_id=storage, ) if "Unmangled" in result: ret.unmangled = decode_req(result["Unmangled"], headers_only=headers_only, storage=storage) if "Response" in result: ret.response = decode_rsp(result["Response"], headers_only=headers_only, storage=storage) if "WSMessages" in result: for wsm in result["WSMessages"]: ret.ws_messages.append(decode_ws(wsm, storage=storage)) return ret def decode_rsp(result, headers_only=False, storage=0): ret = HTTPResponse( status_code=result["StatusCode"], reason=result["Reason"], proto_major=result["ProtoMajor"], proto_minor=result["ProtoMinor"], headers=copy.deepcopy(result["Headers"]), body=base64.b64decode(result["Body"]), headers_only=headers_only, storage_id=storage, ) if "Unmangled" in result: ret.unmangled = decode_rsp(result["Unmangled"], headers_only=headers_only, storage=storage) return ret def decode_ws(result, storage=0): timestamp = None db_id = "" if "Timestamp" in result: timestamp = time_from_nsecs(result["Timestamp"]) if "DbId" in result: db_id = result["DbId"] ret = WSMessage( is_binary=result["IsBinary"], message=base64.b64decode(result["Message"]), to_server=result["ToServer"], timestamp=timestamp, db_id=db_id, storage=storage, ) if "Unmangled" in result: ret.unmangled = decode_ws(result["Unmangled"], storage=storage) return ret def encode_req(req, int_rsp=False): msg = { "DestHost": req.dest_host, "DestPort": req.dest_port, "UseTLS": req.use_tls, "Method": req.method, "Path": req.url.geturl(), "ProtoMajor": req.proto_major, "ProtoMinor": req.proto_major, "Headers": req.headers.dict(), "Tags": list(req.tags), "Body": base64.b64encode(copy.copy(req.body)).decode(), } if not int_rsp: msg["StartTime"] = time_to_nsecs(req.time_start) msg["EndTime"] = time_to_nsecs(req.time_end) if req.unmangled is not None: msg["Unmangled"] = encode_req(req.unmangled) if req.response is not None: msg["Response"] = encode_rsp(req.response) msg["WSMessages"] = [] for wsm in req.ws_messages: msg["WSMessages"].append(encode_ws(wsm)) return msg def encode_rsp(rsp, int_rsp=False): msg = { "ProtoMajor": rsp.proto_major, "ProtoMinor": rsp.proto_minor, "StatusCode": rsp.status_code, "Reason": rsp.reason, "Headers": rsp.headers.dict(), "Body": base64.b64encode(copy.copy(rsp.body)).decode(), } if not int_rsp: if rsp.unmangled is not None: msg["Unmangled"] = encode_rsp(rsp.unmangled) return msg def encode_ws(ws, int_rsp=False): msg = { "Message": base64.b64encode(ws.message).decode(), "IsBinary": ws.is_binary, "toServer": ws.to_server, } if not int_rsp: if ws.unmangled is not None: msg["Unmangled"] = encode_ws(ws.unmangled) msg["Timestamp"] = time_to_nsecs(ws.timestamp) msg["DbId"] = ws.db_id return msg def time_from_nsecs(nsecs): secs = nsecs/1000000000 t = datetime.datetime.utcfromtimestamp(secs) return t def time_to_nsecs(t): if t is None: return None secs = (t-datetime.datetime(1970,1,1)).total_seconds() return int(math.floor(secs * 1000000000)) RequestStatusLine = namedtuple("RequestStatusLine", ["method", "path", "proto_major", "proto_minor"]) ResponseStatusLine = namedtuple("ResponseStatusLine", ["proto_major", "proto_minor", "status_code", "reason"]) def parse_req_sline(sline): if len(sline.split(b' ')) == 3: verb, path, version = sline.split(b' ') elif len(parts) == 2: verb, version = parts.split(b' ') path = b'' else: raise ParseError("malformed statusline") raw_version = version[5:] # strip HTTP/ pmajor, pminor = raw_version.split(b'.', 1) return RequestStatusLine(verb.decode(), path.decode(), int(pmajor), int(pminor)) def parse_rsp_sline(sline): if len(sline.split(b' ')) > 2: version, status_code, reason = sline.split(b' ', 2) else: version, status_code = sline.split(b' ', 1) reason = '' raw_version = version[5:] # strip HTTP/ pmajor, pminor = raw_version.split(b'.', 1) return ResponseStatusLine(int(pmajor), int(pminor), int(status_code), reason.decode()) def _parse_message(bs, sline_parser): header_env, body = re.split(b"\r?\n\r?\n", bs, 1) status_line, header_bytes = re.split(b"\r?\n", header_env, 1) h = Headers() for l in re.split(b"\r?\n", header_bytes): k, v = l.split(b": ", 1) if k.lower != 'content-length': h.add(k.decode(), v.decode()) h.add("Content-Length", str(len(body))) return (sline_parser(status_line), h, body) def parse_request(bs, dest_host='', dest_port=80, use_tls=False): req_sline, headers, body = _parse_message(bs, parse_req_sline) req = HTTPRequest( method=req_sline.method, path=req_sline.path, proto_major=req_sline.proto_major, proto_minor=req_sline.proto_minor, headers=headers.dict(), body=body, dest_host=dest_host, dest_port=dest_port, use_tls=use_tls, ) return req def parse_response(bs): rsp_sline, headers, body = _parse_message(bs, parse_rsp_sline) rsp = HTTPResponse( status_code=rsp_sline.status_code, reason=rsp_sline.reason, proto_major=rsp_sline.proto_major, proto_minor=rsp_sline.proto_minor, headers=headers.dict(), body=body, ) return rsp