In [1]:
from classes import *
import numpy as np, random, operator, pandas as pd, matplotlib.pyplot as plt


In [2]:
class Fitness:
    """Scores one route: total closed-loop distance and its reciprocal.

    ``route`` is a sequence whose elements expose ``distance(other)``. The
    route is treated as a cycle: the last element is linked back to the first.
    """

    def __init__(self, route):
        self.route = route
        # Cached results; they keep these initial values until first computed.
        self.distance = 0
        self.fitness= 0.0
        # Explicit "already computed" markers. Comparing the cached value with 0
        # cannot tell "not computed yet" apart from a result that really is 0,
        # which forced a full recomputation on every call for such routes.
        self._distanceKnown = False
        self._fitnessKnown = False

    def routeDistance(self):
        """Return the summed ``distance`` between consecutive route elements.

        The result is computed once and cached in ``self.distance``. An empty
        route yields 0; a single-element route yields that element's distance
        to itself.
        """
        if not self._distanceKnown:
            stops = self.route
            count = len(stops)
            pathDistance = 0
            for i in range(count):
                # (i + 1) % count wraps the last element back to the first.
                pathDistance += stops[i].distance(stops[(i + 1) % count])
            self.distance = pathDistance
            self._distanceKnown = True
        return self.distance

    def routeFitness(self):
        """Return ``1 / routeDistance()``, cached in ``self.fitness``.

        Raises:
            ZeroDivisionError: when the route distance is exactly 0. No value
                is substituted here because callers turn the fitness back into
                a distance with ``1 / fitness``.
        """
        if not self._fitnessKnown:
            self.fitness = 1 / float(self.routeDistance())
            self._fitnessKnown = True
        return self.fitness

In [3]:
def createRoute(cityList):
    """Return a new list containing every element of ``cityList`` in random order.

    Sampling ``len(cityList)`` elements without replacement produces a random
    permutation; ``cityList`` itself is not modified.
    """
    return random.sample(cityList, len(cityList))

In [4]:
def initialPopulation(popSize, cityList):
    """Build the starting population: ``popSize`` independent random routes.

    Each route comes from ``createRoute(cityList)``; the result is a list of
    ``popSize`` lists.
    """
    return [createRoute(cityList) for _ in range(popSize)]

In [5]:
def rankRoutes(population):
    """Rank every route of ``population`` by fitness, best first.

    Returns a list of ``(index, fitness)`` tuples, where ``index`` is the
    route's position in ``population`` and ``fitness`` is
    ``Fitness(route).routeFitness()``. The list is sorted by descending
    fitness; ties keep their original relative order.
    """
    scored = [
        (position, Fitness(route).routeFitness())
        for position, route in enumerate(population)
    ]
    scored.sort(key=lambda pair: pair[1], reverse=True)
    return scored

In [6]:
def selection(popRanked, eliteSize):
    """Pick the indices of the routes that go into the mating pool.

    The first ``eliteSize`` ranked routes are always kept. Every remaining
    slot is filled by a roulette-wheel draw: a uniform number in [0, 100) is
    compared against the cumulative fitness percentages, and the first route
    whose cumulative percentage reaches the draw is chosen.

    Parameters:
        popRanked: list of ``(index, fitness)`` pairs, best first (the shape
            returned by ``rankRoutes``).
        eliteSize: number of top-ranked routes kept unconditionally. Values
            larger than ``len(popRanked)`` keep every route instead of
            raising ``IndexError``.

    Returns:
        List of route indices (the first item of each pair). For
        ``0 <= eliteSize`` it has exactly ``len(popRanked)`` entries.
    """
    total = len(popRanked)
    if total == 0:
        # Nothing to rank; the cumulative table cannot be built from no rows.
        return []

    fitness = pd.Series([score for _, score in popRanked], dtype=float)
    cumPerc = (100 * fitness.cumsum() / fitness.sum()).tolist()

    eliteCount = min(eliteSize, total)
    selectionResults = [popRanked[rank][0] for rank in range(eliteCount)]

    for _ in range(total - eliteCount):
        pick = 100 * random.random()
        # First rank whose cumulative share covers the draw. If rounding left
        # the final cumulative value below the draw (or the table holds NaN),
        # fall back to the last rank so a slot is never silently dropped.
        chosen = next(
            (rank for rank, bound in enumerate(cumPerc) if pick <= bound),
            total - 1,
        )
        selectionResults.append(popRanked[chosen][0])
    return selectionResults

In [7]:
def matingPool(population, selectionResults):
    """Look up the selected routes.

    Returns ``population[index]`` for every index in ``selectionResults``, in
    the same order. The routes are the same objects as in ``population``, not
    copies, and an index listed several times appears several times.
    """
    return [population[chosen] for chosen in selectionResults]

In [8]:
def breed(parent1, parent2):
    """Combine two parent routes into one child route.

    Two cut positions are drawn at random within ``parent1``. The elements of
    ``parent1`` between them (lower cut inclusive, upper cut exclusive) open
    the child; they are followed by every element of ``parent2`` that is not
    already in that slice, in ``parent2`` order.
    """
    size = len(parent1)
    cutA = int(random.random() * size)
    cutB = int(random.random() * size)
    low, high = min(cutA, cutB), max(cutA, cutB)

    inherited = [parent1[position] for position in range(low, high)]
    remainder = [gene for gene in parent2 if gene not in inherited]
    return inherited + remainder

In [9]:
def breedPopulation(matingpool, eliteSize):
    """Produce the next set of routes from the mating pool.

    The first ``eliteSize`` entries of ``matingpool`` are passed through
    unchanged (same objects). The other ``len(matingpool) - eliteSize``
    entries are children bred from a shuffled copy of the pool, pairing
    element ``k`` with element ``len - 1 - k`` of the shuffle.
    """
    poolSize = len(matingpool)
    # Shuffle first, so random draws happen in the same order as before.
    shuffled = random.sample(matingpool, poolSize)

    offspring = [matingpool[rank] for rank in range(eliteSize)]
    offspring.extend(
        breed(shuffled[k], shuffled[poolSize - k - 1])
        for k in range(poolSize - eliteSize)
    )
    return offspring

In [10]:
def mutate(individual, mutationRate):
    """Randomly swap elements of ``individual`` in place and return it.

    Each position is visited once. With probability ``mutationRate`` its
    element is exchanged with the element at a second, randomly drawn
    position, which may be the same position. The returned object is the list
    that was passed in.
    """
    size = len(individual)
    for position in range(size):
        if random.random() < mutationRate:
            partner = int(random.random() * size)
            individual[position], individual[partner] = (
                individual[partner],
                individual[position],
            )
    return individual

In [11]:
def mutatePopulation(population, mutationRate):
    """Apply ``mutate`` to every route of ``population``.

    Returns a new list holding the results in the original order. ``mutate``
    works in place, so the routes in the returned list are the same objects
    as in ``population``.
    """
    return [mutate(route, mutationRate) for route in population]

In [12]:
def nextGeneration(currentGen, eliteSize, mutationRate):
    """Advance the population by one generation.

    Steps, in order: rank the current routes, select the breeding indices,
    gather the mating pool, breed it, then mutate the offspring. Returns the
    mutated offspring list.
    """
    ranked = rankRoutes(currentGen)
    chosen = selection(ranked, eliteSize)
    pool = matingPool(currentGen, chosen)
    offspring = breedPopulation(pool, eliteSize)
    return mutatePopulation(offspring, mutationRate)

In [13]:
def geneticAlgorithm(population, popSize, eliteSize, mutationRate, generations):
    """Run the genetic search and return the best route of the final generation.

    Parameters:
        population: the items to be ordered. Despite its name, this is the
            list handed to ``initialPopulation`` as the pool each random
            route is drawn from.
        popSize: number of routes kept in every generation.
        eliteSize: number of top-ranked routes carried over each generation.
        mutationRate: per-position swap probability passed on to mutation.
        generations: number of generations to evolve.

    Returns:
        The top-ranked route of the last generation.

    Prints the initial and final "distance" (``1 / fitness`` of the
    top-ranked route) and a progress line every 10 generations.

    Raises:
        IndexError: if the population is empty (``popSize`` of 0), because
            there is no top-ranked route to report.
    """
    pop = initialPopulation(popSize, population)
    print("Initial distance: " + str(1 / rankRoutes(pop)[0][1]))

    for i in range(0, generations):
        if i % 10 == 0:
            print("-- iteration %d -- " % i)
        pop = nextGeneration(pop, eliteSize, mutationRate)

    # Rank the final population once and reuse it for both the report and the
    # lookup; ranking re-evaluates every route, so doing it twice is wasted work.
    bestRouteIndex, bestFitness = rankRoutes(pop)[0]
    print("Final distance: " + str(1 / bestFitness))
    return pop[bestRouteIndex]

In [14]:
import joblib as jb

def write_Slideshow_to_file(slideshow, output_name = "sexybaby.txt"):
    """Write ``slideshow`` to a text file.

    The first line is the number of slides. Each following line describes one
    slide in order: its single id when ``slide.id`` has length 1, otherwise
    its first two ids separated by a space.
    """
    with open(output_name, "w") as out:
        out.write("{}\n".format(len(slideshow.slides)))
        for slide in slideshow.slides:
            ids = slide.id
            if len(ids) == 1:
                line = "{}\n".format(ids[0])
            else:
                line = "{} {}\n".format(ids[0], ids[1])
            out.write(line)

def get_horizontals_from_collection(collection, groupby="average", filename=""):
    """Turn photos into slides and cache the intermediate lists with joblib.

    Photos whose ``orientation`` is ``"V"`` are paired two per slide; every
    other photo becomes a one-photo slide. Both groups are first sorted by
    number of tags, largest first.

    Parameters:
        collection: iterable of photos exposing ``orientation`` and ``tags``.
        groupby: ``"2by2"`` pairs neighbouring vertical photos of the sorted
            list (1st with 2nd, 3rd with 4th, ...). Any other value pairs the
            photo with the fewest tags with the one with the most, then
            moves inwards.
        filename: suffix used in the names of the joblib files written.

    Returns:
        ``(slides_fromVerticals, slides_fromHorizontals)``.

    Side effects:
        Writes four joblib files to the working directory: both sorted photo
        lists and both slide lists.

    With an odd number of vertical photos one photo is left unpaired: the
    last one for ``"2by2"``, the one with the most tags otherwise (it is also
    removed from the cached vertical list in that case).
    """
    # NOTE(review): this placeholder is never used. It is kept only because
    # constructing a Photo may have side effects (e.g. on Photo.id_counter);
    # confirm in `classes` and delete if it has none.
    null_photo = Photo(orientation="", tags=[])
    collection_V = []
    collection_H = []

    for photo in collection:
        if photo.orientation == "V":
            collection_V.append(photo)
        else:
            collection_H.append(photo)

    # Sort both groups in place by number of tags, largest first.
    collection_V.sort(key=lambda photo: len(photo.tags), reverse=True)
    collection_H.sort(key=lambda photo: len(photo.tags), reverse=True)

    slides_fromVerticals = []
    if groupby == "2by2":
        # Stop before a lone trailing photo so index + 1 is always valid.
        for index in range(0, len(collection_V) - 1, 2):
            slides_fromVerticals.append(Slide([collection_V[index], collection_V[index + 1]]))
    else:
        if len(collection_V) % 2 == 1:
            collection_V = collection_V[1:]
        # Measure the list after trimming; the pre-trim length would index
        # one past the end on the first pair.
        m = len(collection_V)
        for i in range(m // 2):
            slides_fromVerticals.append(Slide([collection_V[m - 1 - i], collection_V[i]]))

    slides_fromHorizontals = [Slide([photo]) for photo in collection_H]
    jb.dump(collection_V, "collection_V_{}.joblib".format(filename))
    jb.dump(collection_H, "collection_H_{}.joblib".format(filename))
    jb.dump(slides_fromVerticals, "slides_fromVerticals_{}_{}.joblib".format(groupby,filename))
    jb.dump(slides_fromHorizontals, "slides_fromHorizontals_{}.joblib".format(filename))
    return slides_fromVerticals, slides_fromHorizontals

def get_horizontals_from_file(filename, groupby="average"):
    """Load the two cached slide lists for ``filename`` / ``groupby``.

    Reads the slide files named with the same patterns that
    ``get_horizontals_from_collection`` writes, and returns
    ``(slides_fromVerticals, slides_fromHorizontals)``.
    """
    # NOTE(review): joblib files are pickle-based; only load files this
    # notebook produced itself.
    verticals_path = "slides_fromVerticals_{}_{}.joblib".format(groupby, filename)
    horizontals_path = "slides_fromHorizontals_{}.joblib".format(filename)
    slides_fromVerticals = jb.load(verticals_path)
    slides_fromHorizontals = jb.load(horizontals_path)
    return slides_fromVerticals, slides_fromHorizontals

In [15]:
# Reset the class-level id counter on Photo to 0 before the next input file is read.
# NOTE(review): presumably photo ids are handed out from this counter while reading —
# confirm in `classes` / `input_output`.
Photo.id_counter = 0

In [16]:
import input_output as io
# Read the photos of the "c_memorable_moments" input file.
photos = io.read("c_memorable_moments.txt")
# Build the slides. `filename` is left at its default "", so the joblib files written by
# this call have an empty suffix and share their names with every other dataset cell
# that also relies on the default.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# One flat list of slides: the items the genetic algorithm will put in order.
slides = slides_fromVerticals + slides_fromHorizontals

In [17]:
# Search for a good slide ordering: 100 candidate orderings per generation, the top 20
# carried over each time, per-position swap probability 0.01, 200 generations.
a = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 

Initial distance: -172.0
-- iteration 0 -- 
-- iteration 10 -- 
-- iteration 20 -- 
-- iteration 30 -- 
-- iteration 40 -- 
-- iteration 50 -- 
-- iteration 60 -- 
-- iteration 70 -- 
-- iteration 80 -- 
-- iteration 90 -- 
-- iteration 100 -- 
-- iteration 110 -- 
-- iteration 120 -- 
-- iteration 130 -- 
-- iteration 140 -- 
-- iteration 150 -- 
-- iteration 160 -- 
-- iteration 170 -- 
-- iteration 180 -- 
-- iteration 190 -- 
Final distance: -226.99999999999997


In [18]:
# Display the best ordering returned by geneticAlgorithm (a list of slides).
a

[id= (631, 424), tags= {'td7', 't1k1', 't0l1', 'tbv', 't161', 't7q1', 'tlh1', 'twz', 'tz61', 'tr82', 'tbp1', 'tjb1', 'tq91', 't9z1', 't0g1', 'tqj', 'tqb2', 'tl72', 'tbv1'},
 id= (627,), tags= {'t32', 'tv32', 'tpb2', 't6r', 'tn12', 'tvs1', 't8n', 't332', 'tt02', 'tz61', 't0s'},
 id= (532,), tags= {'tw81', 't3w', 'tfz', 't3k', 't8l', 't651', 't0x', 'tnz1', 'tz22', 't001', 'tjn'},
 id= (107,), tags= {'tgq1', 'tl6', 't9h', 'tnm', 'tf22', 'tsr1'},
 id= (629,), tags= {'tw81', 't3m', 'tpb', 't1j1', 't391', 't512', 'tt21', 't6t', 't8s', 'ttc', 't432', 't152'},
 id= (974, 894), tags= {'tgc', 'th1', 'ttr1', 't88', 'tl3', 't6x', 'tnf', 'td41', 't6t', 'ttt', 't0w1', 'tr2', 'tf2', 'thg1', 't561', 'tt32', 'tjj1', 't511', 'tk6', 'tjc2'},
 id= (421,), tags= {'tbw1', 'tsw', 'th42', 'tfj', 't672', 'tdp', 't692', 'tb92', 'th11'},
 id= (55, 801), tags= {'td7', 'tq11', 't0j1', 'td', 'tpg1', 'tjx1', 't481', 'tfj', 'tpr1', 'tcb2', 'tkt1', 'tpd', 'tn3', 't7p1', 't28', 't181', 'tb92', 'twv1', 'tvp'},
 id= (84,

In [19]:
# Wrap the best ordering in a SlideShow.
# NOTE(review): the meaning of the second argument (None) is defined in `classes` — confirm.
sh = SlideShow(a, None)

In [20]:
# Write the slide count followed by one line of photo ids per slide.
write_Slideshow_to_file(sh, "output_c.txt")

In [21]:
# Reset the class-level id counter on Photo to 0 before reading the next input file.
# NOTE(review): presumably ids are assigned from this counter while reading — confirm.
Photo.id_counter = 0

In [22]:
import input_output as io
# Read the photos of the "b_lovely_landscapes" input file.
photos = io.read("b_lovely_landscapes.txt")
# Build the slides; with the default filename="" the joblib files written here reuse
# the names written for the previous dataset.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# Flat list of slides to be ordered by the genetic algorithm.
slides = slides_fromVerticals + slides_fromHorizontals

In [23]:
# Same search settings as for dataset C.
# NOTE: the recorded run of this cell ended in ZeroDivisionError. The fitness used by
# the algorithm is 1 / route distance, so any route whose distance is exactly 0 raises it.
b_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 

ZeroDivisionError: float division by zero

In [None]:
# Wrap the best ordering in a SlideShow and write it out.
# Depends on `b_file` from the previous cell, which is undefined if that cell failed.
sh_b = SlideShow(b_file, None)
write_Slideshow_to_file(sh_b, "output_b.txt")

In [None]:
# Reset the class-level id counter on Photo to 0 before reading the next input file.
# NOTE(review): presumably ids are assigned from this counter while reading — confirm.
Photo.id_counter = 0

In [None]:
import input_output as io
# Read the photos of the "d_pet_pictures" input file.
photos = io.read("d_pet_pictures.txt")
# Build the slides (joblib files are written with the default empty filename suffix).
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# Flat list of slides to be ordered.
slides = slides_fromVerticals + slides_fromHorizontals
# Search for a good ordering: population 100, 20 elites, swap probability 0.01, 200 generations.
d_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 

In [None]:
# Wrap the best ordering for dataset D in a SlideShow and write it out.
sh_d = SlideShow(d_file, None)
write_Slideshow_to_file(sh_d, "output_d.txt")

In [None]:
# Reset the class-level id counter on Photo to 0 before reading the next input file.
# NOTE(review): presumably ids are assigned from this counter while reading — confirm.
Photo.id_counter = 0

In [None]:
import input_output as io
# Read the photos of the "e_shiny_selfies" input file.
photos = io.read("e_shiny_selfies.txt")
# Build the slides (joblib files are written with the default empty filename suffix).
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# Flat list of slides to be ordered.
slides = slides_fromVerticals + slides_fromHorizontals
# Search for a good ordering: population 100, 20 elites, swap probability 0.01, 200 generations.
e_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 
# Wrap the best ordering in a SlideShow and write it out.
sh_e = SlideShow(e_file, None)
write_Slideshow_to_file(sh_e, "output_e.txt")

In [None]:
# Reset the class-level id counter on Photo to 0 before reading the next input file.
# NOTE(review): presumably ids are assigned from this counter while reading — confirm.
Photo.id_counter = 0

In [None]:
import input_output as io
# Read the photos of the "a_example" input file.
photos = io.read("a_example.txt")
# Build the slides (joblib files are written with the default empty filename suffix).
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# Flat list of slides to be ordered.
slides = slides_fromVerticals + slides_fromHorizontals
# Search for a good ordering: population 100, 20 elites, swap probability 0.01, 200 generations.
a_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 
# Wrap the best ordering in a SlideShow and write it out.
sh_a = SlideShow(a_file, None)
write_Slideshow_to_file(sh_a, "output_a.txt")