Fix bugs

Jugendhackt · Jun 1, 2017 · 0915d24 · 0915d24
1 parent d878209
commit 0915d24
Show file tree

Hide file tree

Showing 5 changed files with 72 additions and 57 deletions.
diff --git a/README.md b/README.md
@@ -16,9 +16,9 @@ After that you can install the dependencies from the requirements.txt via
     pip install -r requirements.txt
 
 ## Running it
-To run neulandeuphonie you simply start the proxy.py executing
+To run neulandeuphonie you simply start the proxy by executing
 
-    python proxy.py
+    mitmdump -s neulandeuph.py
 
 It will start a proxy on *:8080 which you can set in your browser.
 

diff --git a/neulandeuph.py b/neulandeuph.py
@@ -0,0 +1,34 @@
+import proxy_functions
+import configparser as ConfigParser
+import glob, os, re, json
+config = ConfigParser.ConfigParser()
+config.read(['default.ini', 'local.ini'])
+regex_flags = re.IGNORECASE
+tag_expressions = {"fallback": config.get("general", "fallback_language")}
+content_expressions = {"fallback": config.get("general", "fallback_language")}
+for filename in glob.glob("tag_replace/*.json"):
+    with open(filename) as regex_file:
+        lang = os.path.splitext(os.path.basename(filename))[0]
+        tag_expressions[lang] = []
+        regex_list = json.load(regex_file)
+        for expression, replacement_text in regex_list.items():
+            compiled_expression = re.compile(expression, regex_flags)
+            tag_expressions[lang].append((compiled_expression, replacement_text))
+for filename in glob.glob("content_replace/*.json"):
+    with open(filename) as regex_file:
+        lang = os.path.splitext(os.path.basename(filename))[0]
+        content_expressions[lang] = []
+        regex_list = json.load(regex_file)
+        for expression, replacement_text in regex_list.items():
+            compiled_expression = re.compile(expression, regex_flags)
+            content_expressions[lang].append((compiled_expression, replacement_text))
+
+def response(flow):
+    flow = proxy_functions.replaceImage(flow)
+    flow = proxy_functions.censorText(flow, tag_expressions, content_expressions, config.get("general", "stylesheet_file"), config.getboolean("general", "send_stats"), config.getboolean("general","replace"))
+    #flow.reply()
+    return flow
+
+
+def handle_response(*args, **kwargs):
+    print(args, kwargs)
diff --git a/proxy.py b/proxy.py
@@ -1,21 +1,18 @@
 #!/usr/bin/env python
 # -*- coding: utf-8 -*-
-import sys; reload(sys); sys.setdefaultencoding("utf-8") # hack to set default encoding
 import json
 import re
-from libmproxy import controller, proxy
-from libmproxy.proxy.server import ProxyServer
+from mitmproxy import controller, proxy
+from mitmproxy.proxy.server import ProxyServer
 import proxy_functions
 import threading
-import ConfigParser
+import configparser as ConfigParser
 import glob
 import os
 
 
-class CensorMaster(controller.Master):
-
+class CensorMaster():
     def __init__(self, server):
-        controller.Master.__init__(self, server)
         self.config = ConfigParser.ConfigParser()
         self.config.read(['default.ini', 'local.ini'])
         self.regex_flags = re.IGNORECASE

diff --git a/proxy_functions.py b/proxy_functions.py
@@ -1,13 +1,12 @@
 import re
-from wand.image import Image
+from PIL import Image
 import io
 import requests
 import os
 import random
 import sys
-from libmproxy.protocol.http import HTTPResponse
-from netlib.odict import ODictCaseless
-import StringIO
+from mitmproxy.http import HTTPResponse
+import io
 from bs4 import BeautifulSoup, NavigableString
 import linecache
 
@@ -19,7 +18,7 @@ def PrintException():
     filename = f.f_code.co_filename
     linecache.checkcache(filename)
     line = linecache.getline(filename, lineno, f.f_globals)
-    print 'EXCEPTION IN ({}, LINE {} "{}"): {}'.format(filename, lineno, line.strip(), exc_obj)
+    print('EXCEPTION IN ({}, LINE {} "{}"): {}'.format(filename, lineno, line.strip(), exc_obj))
 
 
 def getsizes(image_data):
@@ -28,38 +27,43 @@ def getsizes(image_data):
 
 
 def resizeImg(sourceFile, width, height):
-    img = Image(filename=sourceFile)
-    if width > height:
+    img = Image.open(sourceFile)
+    """if width > height:
         img.transform(resize="%d" % (width))
     else:
-        img.transform(resize="x%d" % (height))
+        img.transform(resize="x%d" % (height))"""
+    img.thumbnail((width, height))
     wd = img.width - width
     hd = img.height - height
-    img.crop(wd / 2, hd / 2, width=width, height=height)
+    img.crop((wd / 2, hd / 2, width, height))
     img.format = 'jpeg'
     return img
 
 
 def replaceImage(flow):
-    attrs = dict((x.lower(), y) for x, y in flow.response.headers)
+    attrs = dict((x.lower(), y) for x, y in flow.response.headers.items())
     if "content-type" in attrs:
         if "image" in attrs['content-type'] and not "svg" in attrs['content-type']:
-            if flow.response.code == 304:
+            if flow.response.status_code == 304:
                 content = flow.response.content
             else:
                 content = requests.get(flow.request.url).content
             if len(content) == 0:
                 return flow
             try:
-                img = Image(file=io.BytesIO(content))
+                img = Image.open(io.BytesIO(content))
                 size = img.size
                 if size[0] > 40 and size[1] > 40:
                     filename = random.choice(os.listdir("images"))
                     img = resizeImg("images/" + filename, size[0], size[1])
-                    content = img.make_blob()
-                    responseHeaders = ODictCaseless([('Content-Length', len(content))])
-                    responseHeaders['Content-Type'] = ["image/jpg"]
-                    resp = HTTPResponse([1, 1], 200, 'OK', responseHeaders, content)
+                    #content = img.make_blob()
+                    imgByteArr = io.BytesIO()
+                    img.save(imgByteArr, format='JPEG')
+                    content = imgByteArr.getvalue()
+                    responseHeaders = {'Content-Length':str(len(content))}
+                    responseHeaders['Content-Type'] = "image/jpg"
+                    #import pdb;pdb.set_trace()
+                    resp = HTTPResponse.make(status_code=200, headers=responseHeaders, content=content)
                     flow.response = resp
 
             except:
@@ -76,23 +80,24 @@ def adjustCasing(original, to_adjust):
 
 
 def censorText(flow, tag_expressions, content_expressions, stylesheet, send_stats, replace=False):
-    attrs = dict((x.lower(), y) for x, y in flow.response.headers)
+    attrs = dict((x.lower(), y) for x, y in flow.response.headers.items())
     if 'content-type' in attrs:
         if ('text/html' in attrs['content-type']):
             if send_stats:
                 stat = {"type": "statistic", "changes": []}
                 stat['url'] = flow.request.url
-            flow.response.headers['content-type'] = ["text/html"]
-            if 'content-encoding' in flow.response.headers.keys():
+            flow.response.headers['content-type'] = "text/html"
+            if 'content-encoding' in list(flow.response.headers.keys()):
+                import pdb;pdb.set_trace()
                 flow.response.content = flow.response.get_decoded_content()
                 del flow.response.headers['content-encoding']
-            page = BeautifulSoup(flow.response.get_decoded_content())
+            page = BeautifulSoup(flow.response.content.decode())
             lang = detectLanguage(page)
             lang = lang if lang in tag_expressions or lang in content_expressions else tag_expressions['fallback']
             if lang in tag_expressions:
                 for tag in page.findAll(text=True):
                     if type(tag) == NavigableString:
-                        string = unicode(tag.string)
+                        string = str(tag.string)
                         for key, value in tag_expressions[lang]:
                             value_rand = random.choice(value)
                             if not replace:
@@ -104,7 +109,7 @@ def censorText(flow, tag_expressions, content_expressions, stylesheet, send_stat
                                 stats['changes'].append(replace_data[1])
                         tag.string.replace_with(string)
             page = injectCSS(page, stylesheet)
-            flow.response.content = str(page)
+            flow.response.set_content(str(page).encode())
             if lang in content_expressions:
                 for key, value in content_expressions[lang]:
                     flow.response.content = re.sub(key, random.choice(value), flow.response.content)

diff --git a/requirements.txt b/requirements.txt
@@ -1,26 +1,5 @@
-backports.ssl-match-hostname==3.4.0.2
-beautifulsoup4==4.3.2
-blinker==1.3
-certifi==2015.4.28
-cffi==1.4.1
-ConfigArgParse==0.9.3
-configparser
-enum34==1.0.4
-hpack==1.0.1
-idna==2.0
-ipaddress==1.0.7
-lxml==3.4.4
-mitmproxy==0.12.1
-netlib==0.12.1
-passlib==1.6.2
-Pillow==2.8.2
-pyasn1==0.1.7
-pycparser==2.13
-pyOpenSSL==0.15.1
-pyperclip==1.5.11
-requests==2.7.0
-six==1.9.0
-tornado==4.2
-urwid==1.3.0
-Wand==0.4.0
-wheel==0.24.0
+beautifulsoup4
+lxml
+mitmproxy
+Pillow
+requests