From 82a90511bc61b4ed98cd7ff2455b79dec015c45f Mon Sep 17 00:00:00 2001 From: Chris Czub Date: Mon, 9 Nov 2015 11:06:16 -0500 Subject: [PATCH 1/4] Add "add" ContentView method & test --- libmproxy/contentviews.py | 8 ++++++++ test/test_contentview.py | 13 +++++++++++++ 2 files changed, 21 insertions(+) diff --git a/libmproxy/contentviews.py b/libmproxy/contentviews.py index 9af080335..8d5aadfce 100644 --- a/libmproxy/contentviews.py +++ b/libmproxy/contentviews.py @@ -515,6 +515,14 @@ def get_by_shortcut(c): return i +def add(obj): + for i in views: + if i.name == obj.name: + raise ContentViewException("Duplicate view: " + obj.name) + + views.append(obj) + + def get(name): for i in views: if i.name == name: diff --git a/test/test_contentview.py b/test/test_contentview.py index 976085209..68272fca3 100644 --- a/test/test_contentview.py +++ b/test/test_contentview.py @@ -210,6 +210,19 @@ Larry assert "decoded gzip" in r[0] assert "Raw" in r[0] + def test_add_cv(self): + class TestContentView(cv.View): + name = "test" + + tcv = TestContentView() + cv.add(tcv) + + tutils.raises( + ContentViewException, + cv.add, + tcv + ) + if pyamf: def test_view_amf_request(): From d7239d665e6781d7b84ecfde3fd5d7d1831de284 Mon Sep 17 00:00:00 2001 From: Chris Czub Date: Mon, 9 Nov 2015 15:07:08 -0500 Subject: [PATCH 2/4] Add new contentviews' content type mappings --- libmproxy/contentviews.py | 10 ++++++++++ test/test_contentview.py | 1 + 2 files changed, 11 insertions(+) diff --git a/libmproxy/contentviews.py b/libmproxy/contentviews.py index 8d5aadfce..aa2082d1c 100644 --- a/libmproxy/contentviews.py +++ b/libmproxy/contentviews.py @@ -520,8 +520,18 @@ def add(obj): if i.name == obj.name: raise ContentViewException("Duplicate view: " + obj.name) + for prompt in view_prompts: + if prompt[1] == obj.prompt[1]: + raise ContentViewException("Duplicate view shortcut: " + obj.prompt[1]) + views.append(obj) + for ct in obj.content_types: + l = content_types_map.setdefault(ct, []) + l.append(obj) + + view_prompts.append(obj.prompt) + def get(name): for i in views: diff --git a/test/test_contentview.py b/test/test_contentview.py index 68272fca3..c1e437e49 100644 --- a/test/test_contentview.py +++ b/test/test_contentview.py @@ -217,6 +217,7 @@ Larry tcv = TestContentView() cv.add(tcv) + # repeated addition causes exception tutils.raises( ContentViewException, cv.add, From d3feaa3bc6e2d9c2c7ee8286038c69c0b9601869 Mon Sep 17 00:00:00 2001 From: Chris Czub Date: Mon, 9 Nov 2015 15:07:58 -0500 Subject: [PATCH 3/4] Add custom content view plugin support for mitmproxy/mitmdump --- libmproxy/flow.py | 46 ++++++++++++++++++++++++++++++- libmproxy/script.py | 7 +++++ test/test_custom_contentview.py | 49 +++++++++++++++++++++++++++++++++ test/test_script.py | 10 +++++++ 4 files changed, 111 insertions(+), 1 deletion(-) create mode 100644 test/test_custom_contentview.py diff --git a/libmproxy/flow.py b/libmproxy/flow.py index 55a4dbcfb..5acbebf21 100644 --- a/libmproxy/flow.py +++ b/libmproxy/flow.py @@ -9,7 +9,7 @@ import cookielib import os import re import urlparse - +import inspect from netlib import wsgi from netlib.exceptions import HttpException @@ -21,6 +21,11 @@ from .proxy.config import HostMatcher from .protocol.http_replay import RequestReplayThread from .protocol import Kill from .models import ClientConnection, ServerConnection, HTTPResponse, HTTPFlow, HTTPRequest +from . import contentviews as cv + + +class PluginError(Exception): + pass class AppRegistry: @@ -614,6 +619,43 @@ class State(object): self.flows.kill_all(master) +class Plugins(object): + def __init__(self): + self._view_plugins = {} + + def __iter__(self): + for plugin_type in ('view_plugins',): + yield (plugin_type, getattr(self, '_' + plugin_type)) + + def __getitem__(self, key): + if key in ('view_plugins',): + return getattr(self, '_' + key) + else: + return None + + def register_view(self, id, **kwargs): + if self._view_plugins.get(id): + raise PluginError("Duplicate view registration for %s" % (id, )) + + if not kwargs.get('class_ref') or not \ + callable(kwargs['class_ref']) or not \ + isinstance(kwargs['class_ref'], type): + raise PluginError("No custom content view class passed for view %s" % (id, )) + + script_path = inspect.stack()[1][1] + + view_plugin = { + 'title': kwargs.get('title') or id, + 'class_ref': kwargs['class_ref'], + 'script_path': script_path, + } + self._view_plugins[id] = view_plugin + + cv.add(kwargs['class_ref']()) + + print("Registered view plugin %s from script %s" % (kwargs['title'], script_path)) + + class FlowMaster(controller.Master): def __init__(self, server, state): controller.Master.__init__(self, server) @@ -643,6 +685,8 @@ class FlowMaster(controller.Master): self.stream = None self.apps = AppRegistry() + self.plugins = Plugins() + def start_app(self, host, port): self.apps.add( app.mapp, diff --git a/libmproxy/script.py b/libmproxy/script.py index 9d051c129..f11c5cd87 100644 --- a/libmproxy/script.py +++ b/libmproxy/script.py @@ -56,6 +56,13 @@ class ScriptContext: def app_registry(self): return self._master.apps + @property + def plugins(self): + if hasattr(self._master, 'plugins'): + return self._master.plugins + + return None + class Script: """ diff --git a/test/test_custom_contentview.py b/test/test_custom_contentview.py new file mode 100644 index 000000000..2ca184d0a --- /dev/null +++ b/test/test_custom_contentview.py @@ -0,0 +1,49 @@ +from libmproxy import script, flow +import libmproxy.contentviews as cv +from netlib.http import Headers + + +def test_custom_views(): + plugins = flow.Plugins() + + # two types: view and action + assert 'view_plugins' in dict(plugins).keys() + + view_plugins = plugins['view_plugins'] + assert len(view_plugins) == 0 + + class ViewNoop(cv.View): + name = "noop" + prompt = ("noop", "n") + content_types = ["text/none"] + + def __call__(self, data, **metadata): + return "noop", cv.format_text(data) + + plugins.register_view('noop', + title='Noop View Plugin', + class_ref=ViewNoop) + + assert len(view_plugins) == 1 + assert view_plugins['noop']['title'] == 'Noop View Plugin' + + assert cv.get("noop") + + r = cv.get_content_view( + cv.get("noop"), + "[1, 2, 3]", + headers=Headers( + content_type="text/plain" + ) + ) + assert "noop" in r[0] + + # now try content-type matching + r = cv.get_content_view( + cv.get("Auto"), + "[1, 2, 3]", + headers=Headers( + content_type="text/none" + ) + ) + assert "noop" in r[0] diff --git a/test/test_script.py b/test/test_script.py index 1b0e5a5b4..f0883ad5e 100644 --- a/test/test_script.py +++ b/test/test_script.py @@ -127,3 +127,13 @@ def test_command_parsing(): absfilepath = os.path.normcase(tutils.test_data.path("scripts/a.py")) s = script.Script(absfilepath, fm) assert os.path.isfile(s.args[0]) + + +def test_script_plugins(): + s = flow.State() + fm = flow.FlowMaster(None, s) + sp = tutils.test_data.path("scripts/a.py") + p = script.Script("%s --var 40" % sp, fm) + + assert hasattr(p.ctx, 'plugins') + From e72a9a62a107ea3f53b6b26d1abe63c554448d17 Mon Sep 17 00:00:00 2001 From: Chris Czub Date: Fri, 13 Nov 2015 16:55:27 -0500 Subject: [PATCH 4/4] Feedback from PR #832 --- examples/custom_contentviews.py | 66 +++++++++++++++++++++++++++ libmproxy/contentviews.py | 81 ++++++++++++++++++--------------- libmproxy/flow.py | 43 ----------------- libmproxy/script.py | 11 +++-- test/test_contentview.py | 1 + test/test_custom_contentview.py | 29 ++++++------ test/test_script.py | 9 ---- 7 files changed, 134 insertions(+), 106 deletions(-) create mode 100644 examples/custom_contentviews.py diff --git a/examples/custom_contentviews.py b/examples/custom_contentviews.py new file mode 100644 index 000000000..1a2bcb1e8 --- /dev/null +++ b/examples/custom_contentviews.py @@ -0,0 +1,66 @@ +import string +from libmproxy import script, flow, utils +import libmproxy.contentviews as cv +from netlib.http import Headers +import lxml.html +import lxml.etree + + +class ViewPigLatin(cv.View): + name = "pig_latin_HTML" + prompt = ("pig latin HTML", "l") + content_types = ["text/html"] + + def __call__(self, data, **metadata): + if utils.isXML(data): + parser = lxml.etree.HTMLParser( + strip_cdata=True, + remove_blank_text=True + ) + d = lxml.html.fromstring(data, parser=parser) + docinfo = d.getroottree().docinfo + + def piglify(src): + words = string.split(src) + ret = '' + for word in words: + idx = -1 + while word[idx] in string.punctuation and (idx * -1) != len(word): idx -= 1 + if word[0].lower() in 'aeiou': + if idx == -1: ret += word[0:] + "hay" + else: ret += word[0:len(word)+idx+1] + "hay" + word[idx+1:] + else: + if idx == -1: ret += word[1:] + word[0] + "ay" + else: ret += word[1:len(word)+idx+1] + word[0] + "ay" + word[idx+1:] + ret += ' ' + return ret.strip() + + def recurse(root): + if hasattr(root, 'text') and root.text: + root.text = piglify(root.text) + if hasattr(root, 'tail') and root.tail: + root.tail = piglify(root.tail) + + if len(root): + for child in root: + recurse(child) + + recurse(d) + + s = lxml.etree.tostring( + d, + pretty_print=True, + doctype=docinfo.doctype + ) + return "HTML", cv.format_text(s) + + +pig_view = ViewPigLatin() + + +def start(context, argv): + context.add_contentview(pig_view) + + +def stop(context): + context.remove_contentview(pig_view) diff --git a/libmproxy/contentviews.py b/libmproxy/contentviews.py index aa2082d1c..2f46cccaf 100644 --- a/libmproxy/contentviews.py +++ b/libmproxy/contentviews.py @@ -479,34 +479,9 @@ class ViewWBXML(View): return None -views = [ - ViewAuto(), - ViewRaw(), - ViewHex(), - ViewJSON(), - ViewXML(), - ViewWBXML(), - ViewHTML(), - ViewHTMLOutline(), - ViewJavaScript(), - ViewCSS(), - ViewURLEncoded(), - ViewMultipart(), - ViewImage(), -] -if pyamf: - views.append(ViewAMF()) - -if ViewProtobuf.is_available(): - views.append(ViewProtobuf()) - +views = [] content_types_map = {} -for i in views: - for ct in i.content_types: - l = content_types_map.setdefault(ct, []) - l.append(i) - -view_prompts = [i.prompt for i in views] +view_prompts = [] def get_by_shortcut(c): @@ -515,24 +490,58 @@ def get_by_shortcut(c): return i -def add(obj): +def add(view): + # TODO: auto-select a different name (append an integer?) for i in views: - if i.name == obj.name: - raise ContentViewException("Duplicate view: " + obj.name) + if i.name == view.name: + raise ContentViewException("Duplicate view: " + view.name) + # TODO: the UI should auto-prompt for a replacement shortcut for prompt in view_prompts: - if prompt[1] == obj.prompt[1]: - raise ContentViewException("Duplicate view shortcut: " + obj.prompt[1]) + if prompt[1] == view.prompt[1]: + raise ContentViewException("Duplicate view shortcut: " + view.prompt[1]) - views.append(obj) + views.append(view) - for ct in obj.content_types: + for ct in view.content_types: l = content_types_map.setdefault(ct, []) - l.append(obj) + l.append(view) - view_prompts.append(obj.prompt) + view_prompts.append(view.prompt) +def remove(view): + for ct in view.content_types: + l = content_types_map.setdefault(ct, []) + l.remove(view) + + if not len(l): + del content_types_map[ct] + + view_prompts.remove(view.prompt) + views.remove(view) + + +add(ViewAuto()) +add(ViewRaw()) +add(ViewHex()) +add(ViewJSON()) +add(ViewXML()) +add(ViewWBXML()) +add(ViewHTML()) +add(ViewHTMLOutline()) +add(ViewJavaScript()) +add(ViewCSS()) +add(ViewURLEncoded()) +add(ViewMultipart()) +add(ViewImage()) + +if pyamf: + add(ViewAMF()) + +if ViewProtobuf.is_available(): + add(ViewProtobuf()) + def get(name): for i in views: if i.name == name: diff --git a/libmproxy/flow.py b/libmproxy/flow.py index 5acbebf21..3343e694f 100644 --- a/libmproxy/flow.py +++ b/libmproxy/flow.py @@ -24,10 +24,6 @@ from .models import ClientConnection, ServerConnection, HTTPResponse, HTTPFlow, from . import contentviews as cv -class PluginError(Exception): - pass - - class AppRegistry: def __init__(self): self.apps = {} @@ -619,43 +615,6 @@ class State(object): self.flows.kill_all(master) -class Plugins(object): - def __init__(self): - self._view_plugins = {} - - def __iter__(self): - for plugin_type in ('view_plugins',): - yield (plugin_type, getattr(self, '_' + plugin_type)) - - def __getitem__(self, key): - if key in ('view_plugins',): - return getattr(self, '_' + key) - else: - return None - - def register_view(self, id, **kwargs): - if self._view_plugins.get(id): - raise PluginError("Duplicate view registration for %s" % (id, )) - - if not kwargs.get('class_ref') or not \ - callable(kwargs['class_ref']) or not \ - isinstance(kwargs['class_ref'], type): - raise PluginError("No custom content view class passed for view %s" % (id, )) - - script_path = inspect.stack()[1][1] - - view_plugin = { - 'title': kwargs.get('title') or id, - 'class_ref': kwargs['class_ref'], - 'script_path': script_path, - } - self._view_plugins[id] = view_plugin - - cv.add(kwargs['class_ref']()) - - print("Registered view plugin %s from script %s" % (kwargs['title'], script_path)) - - class FlowMaster(controller.Master): def __init__(self, server, state): controller.Master.__init__(self, server) @@ -685,8 +644,6 @@ class FlowMaster(controller.Master): self.stream = None self.apps = AppRegistry() - self.plugins = Plugins() - def start_app(self, host, port): self.apps.add( app.mapp, diff --git a/libmproxy/script.py b/libmproxy/script.py index f11c5cd87..4da40c52f 100644 --- a/libmproxy/script.py +++ b/libmproxy/script.py @@ -5,6 +5,8 @@ import threading import shlex import sys +from . import contentviews as cv + class ScriptError(Exception): pass @@ -56,12 +58,11 @@ class ScriptContext: def app_registry(self): return self._master.apps - @property - def plugins(self): - if hasattr(self._master, 'plugins'): - return self._master.plugins + def add_contentview(self, view_obj): + cv.add(view_obj) - return None + def remove_contentview(self, view_obj): + cv.remove(view_obj) class Script: diff --git a/test/test_contentview.py b/test/test_contentview.py index c1e437e49..eba624a26 100644 --- a/test/test_contentview.py +++ b/test/test_contentview.py @@ -213,6 +213,7 @@ Larry def test_add_cv(self): class TestContentView(cv.View): name = "test" + prompt = ("t", "test") tcv = TestContentView() cv.add(tcv) diff --git a/test/test_custom_contentview.py b/test/test_custom_contentview.py index 2ca184d0a..4b5a3e53f 100644 --- a/test/test_custom_contentview.py +++ b/test/test_custom_contentview.py @@ -4,14 +4,6 @@ from netlib.http import Headers def test_custom_views(): - plugins = flow.Plugins() - - # two types: view and action - assert 'view_plugins' in dict(plugins).keys() - - view_plugins = plugins['view_plugins'] - assert len(view_plugins) == 0 - class ViewNoop(cv.View): name = "noop" prompt = ("noop", "n") @@ -20,12 +12,10 @@ def test_custom_views(): def __call__(self, data, **metadata): return "noop", cv.format_text(data) - plugins.register_view('noop', - title='Noop View Plugin', - class_ref=ViewNoop) - assert len(view_plugins) == 1 - assert view_plugins['noop']['title'] == 'Noop View Plugin' + view_obj = ViewNoop() + + cv.add(view_obj) assert cv.get("noop") @@ -47,3 +37,16 @@ def test_custom_views(): ) ) assert "noop" in r[0] + + # now try removing the custom view + cv.remove(view_obj) + r = cv.get_content_view( + cv.get("Auto"), + "[1, 2, 3]", + headers=Headers( + content_type="text/none" + ) + ) + assert "noop" not in r[0] + + diff --git a/test/test_script.py b/test/test_script.py index f0883ad5e..8612d5f34 100644 --- a/test/test_script.py +++ b/test/test_script.py @@ -128,12 +128,3 @@ def test_command_parsing(): s = script.Script(absfilepath, fm) assert os.path.isfile(s.args[0]) - -def test_script_plugins(): - s = flow.State() - fm = flow.FlowMaster(None, s) - sp = tutils.test_data.path("scripts/a.py") - p = script.Script("%s --var 40" % sp, fm) - - assert hasattr(p.ctx, 'plugins') -