In [1]:
from io import BytesIO
import pycurl,timeit
from multiprocessing import Process
from multiprocessing import Manager

# Performance with proxy

In [2]:
def proxy_latency(prox_type,host,port,target,return_list):
    """Download ``target`` through the proxy at ``host:port`` and record libcurl timings.

    Args:
        prox_type: Label copied into the result under 'prox_type'; it does not
            influence how the request is made.
        host: Proxy host name or IP address.
        port: Proxy port (joined to ``host`` as ``"host:port"``).
        target: URL to fetch.
        return_list: Object with an ``append`` method (a plain list or a
            ``Manager().list()`` proxy). The timing record is appended to it so
            that callers running this function in a child process can still
            collect the result.

    Returns:
        dict: 'prox_type', 'target' and the libcurl timers 'total-time',
        'namelookup-time', 'connect-time', 'pretransfer-time' and
        'starttransfer-time'.

    Raises:
        Whatever ``Curl.perform()`` raises when the transfer fails. In that
        case nothing is appended to ``return_list``, and the handle is still
        closed.
    """
    buffer = BytesIO()
    c = pycurl.Curl()
    try:
        c.setopt(pycurl.PROXY, f"{host}:{port}")
        c.setopt(pycurl.URL, target)
        # The response body is not inspected; it is only captured in memory.
        c.setopt(c.WRITEDATA, buffer)
        c.perform()

        # Timers must be read before the handle is closed.
        m = {
            'prox_type': prox_type,
            'target': target,
            'total-time': c.getinfo(pycurl.TOTAL_TIME),
            'namelookup-time': c.getinfo(pycurl.NAMELOOKUP_TIME),
            'connect-time': c.getinfo(pycurl.CONNECT_TIME),
            'pretransfer-time': c.getinfo(pycurl.PRETRANSFER_TIME),
            'starttransfer-time': c.getinfo(pycurl.STARTTRANSFER_TIME),
        }
    finally:
        # Release the handle even when the transfer raises.
        c.close()

    return_list.append(m)
    return m


# Performance without proxy

In [3]:
def normal_latency(port,target,return_list):
    """Download ``target`` directly (no proxy) and record libcurl timings.

    Args:
        port: Unused by this function; kept so existing callers that pass it
            keep working.
        target: URL to fetch.
        return_list: Object with an ``append`` method (a plain list or a
            ``Manager().list()`` proxy). The timing record is appended to it so
            that callers running this function in a child process can still
            collect the result.

    Returns:
        dict: 'prox_type' (always "N/A"), 'target' and the libcurl timers
        'total-time', 'namelookup-time', 'connect-time', 'pretransfer-time'
        and 'starttransfer-time'. The same dict is appended to ``return_list``.

    Raises:
        Whatever ``Curl.perform()`` raises when the transfer fails. In that
        case nothing is appended to ``return_list``, and the handle is still
        closed.
    """
    buffer = BytesIO()
    c = pycurl.Curl()
    try:
        c.setopt(pycurl.URL, target)
        # The response body is not inspected; it is only captured in memory.
        c.setopt(c.WRITEDATA, buffer)
        c.perform()

        # Timers must be read before the handle is closed.
        m = {
            'prox_type': "N/A",
            'target': target,
            'total-time': c.getinfo(pycurl.TOTAL_TIME),
            'namelookup-time': c.getinfo(pycurl.NAMELOOKUP_TIME),
            'connect-time': c.getinfo(pycurl.CONNECT_TIME),
            'pretransfer-time': c.getinfo(pycurl.PRETRANSFER_TIME),
            'starttransfer-time': c.getinfo(pycurl.STARTTRANSFER_TIME),
        }
    finally:
        # Release the handle even when the transfer raises.
        c.close()

    return_list.append(m)
    # Returned as well as appended, matching proxy_latency.
    return m
    

# Setup

In [4]:
# URL fetched by the measurements that follow; alternatives kept for reference.
target = "http://www.cs.cmu.edu/~prs/bio.html"
# target = "https://github.com/"
# target = "http://www.cs.tufts.edu/comp/112/"

# Address of the proxy passed to proxy_latency.
host = "130.64.148.78"
port = "8080"

# Number of requests issued by each averaged run.
range_k = 100

# Without proxy

## 1. One time

In [5]:
# One direct request; show the timing record it produced.
return_list = list()
normal_latency(port, target, return_list)
print(return_list[0])

{'prox_type': 'N/A', 'target': 'http://www.cs.cmu.edu/~prs/bio.html', 'total-time': 0.341654, 'namelookup-time': 0.005058, 'connect-time': 0.022789, 'pretransfer-time': 0.022873, 'starttransfer-time': 0.306076}


## 2. Average time (100 requests)

In [6]:
# Issue range_k direct requests one after another; each call appends its
# timing record to return_list (the function's return value is not needed).
return_list = []
for _ in range(range_k):
    normal_latency(port, target, return_list)

total = sum(record["total-time"] for record in return_list)

# Mean total time per request.
total / range_k

0.12766182

# Our project - select + pthread

In [7]:
# Label stored under 'prox_type' in every record produced by proxy_latency;
# it tags the results and is not used to configure the request.
prox_type = "select"

## 1. One time without cache

In [8]:
# One request through the proxy; show the timing record it produced.
return_list = list()
proxy_latency(prox_type, host, port, target, return_list)
print(return_list[0])

{'prox_type': 'select', 'target': 'http://www.cs.cmu.edu/~prs/bio.html', 'total-time': 0.075657, 'namelookup-time': 5.9e-05, 'connect-time': 0.000188, 'pretransfer-time': 0.00025, 'starttransfer-time': 0.075588}


## 2. Average time with cache (100 requests)

In [9]:
# Send range_k sequential requests through the proxy, collecting one timing
# record per request.
return_list = []
for _ in range(range_k):
    proxy_latency(prox_type, host, port, target, return_list)

# Accumulate the total transfer time across all records.
total = 0
for sample in return_list:
    total += sample["total-time"]

# Mean total time per request.
total / range_k

0.00048904

# Fully fork version - without cache

In [10]:
# prox_type = "fork"


In [11]:
# total = 0
# return_list = []

# for n in range(range_k):
#    result = proxy_latency(prox_type,host,port,target,return_list)
#    total+= result["total-time"]
    
# total/range_k

# Fully pthread version - without cache

In [12]:
# prox_type = "pthread"

In [13]:
# total = 0
# return_list = []

# for n in range(range_k):
#    result = proxy_latency(prox_type,host,port,target,return_list)
#    total+= result["total-time"]
    
# total/range_k

# Simulate multi users - multiprocesses

## Without proxy - http, 100 concurrent requests

In [14]:
# One process per simulated user, all started before any is joined so the
# requests overlap. The context manager shuts the Manager's server process
# down once the results have been copied out.
with Manager() as manager:
    shared_results = manager.list()
    jobs = []

    for i in range(range_k):
        p = Process(target=normal_latency,args=(port,target,shared_results))
        jobs.append(p)
        p.start()

    for proc in jobs:
        proc.join()

    # Copy out of the proxy while the manager is still alive.
    return_list = list(shared_results)

total = sum(item["total-time"] for item in return_list)

# Average over the requests that actually reported a record: a worker whose
# transfer raised appends nothing, so dividing by range_k would understate
# the latency. NaN signals that no request completed.
total / len(return_list) if return_list else float("nan")

0.4735701200000002

## Proxy - http with cache, 100 concurrent requests

In [15]:
# One process per simulated user, all started before any is joined so the
# requests overlap. The context manager shuts the Manager's server process
# down once the results have been copied out.
with Manager() as manager:
    shared_results = manager.list()
    jobs = []

    for i in range(range_k):
        p = Process(target=proxy_latency,args=(prox_type,host,port,target,shared_results))
        jobs.append(p)
        p.start()

    for proc in jobs:
        proc.join()

    # Copy out of the proxy while the manager is still alive.
    return_list = list(shared_results)

total = sum(item["total-time"] for item in return_list)

# Average over the requests that actually reported a record: a worker whose
# transfer raised appends nothing, so dividing by range_k would understate
# the latency. NaN signals that no request completed.
total / len(return_list) if return_list else float("nan")

0.0007377399999999996

In [16]:
# The runs below use a larger request count and an HTTPS target.
range_k = 200
target = "https://github.com/"

## Without proxy - https, 200 concurrent requests

In [23]:
# One process per simulated user, all started before any is joined so the
# requests overlap. The context manager shuts the Manager's server process
# down once the results have been copied out.
with Manager() as manager:
    shared_results = manager.list()
    jobs = []

    for i in range(range_k):
        p = Process(target=normal_latency,args=(port,target,shared_results))
        jobs.append(p)
        p.start()

    for proc in jobs:
        proc.join()

    # Copy out of the proxy while the manager is still alive.
    return_list = list(shared_results)

total = sum(item["total-time"] for item in return_list)

# Average over the requests that actually reported a record: a worker whose
# transfer raised appends nothing, so dividing by range_k would understate
# the latency. NaN signals that no request completed.
total / len(return_list) if return_list else float("nan")

1.5326971750000007

## Proxy - https without cache, 200 concurrent requests

In [24]:
# One process per simulated user, all started before any is joined so the
# requests overlap. The context manager shuts the Manager's server process
# down once the results have been copied out.
with Manager() as manager:
    shared_results = manager.list()
    jobs = []

    for i in range(range_k):
        p = Process(target=proxy_latency,args=(prox_type,host,port,target,shared_results))
        jobs.append(p)
        p.start()

    for proc in jobs:
        proc.join()

    # Copy out of the proxy while the manager is still alive.
    return_list = list(shared_results)

total = sum(item["total-time"] for item in return_list)

# Average over the requests that actually reported a record: a worker whose
# transfer raised appends nothing, so dividing by range_k would understate
# the latency. NaN signals that no request completed.
total / len(return_list) if return_list else float("nan")

1.1123836000000002

In [19]:
# 10: https noproxy: 0.21 select+pthread: 0.33 select: 0.48  fork: 0.24
# 50: https noproxy: 0.42 select+pthread: 1.35 select: 2.11  fork: 0.39
# 100: https noproxy: 0.78 select+pthread: 2.24 select: 3.32 fork: 0.74
# 200: https noproxy: 1.26 select+pthread: 4.12 select: 7.11 fork: 1.11

In [None]:
# Single request
# https noproxy: 0.17 select+pthread: 0.18 select: 0.21 fork: 0.21