In [1]:
from classes import *
import numpy as np, random, operator, pandas as pd, matplotlib.pyplot as plt


In [2]:
class Fitness:
    """Score a route as a closed tour.

    ``route`` is a sequence whose elements expose ``distance(other)``.
    The tour length and its reciprocal (the fitness) are computed lazily and
    cached on the instance; a cached value of 0 means "not computed yet".
    """

    def __init__(self, route):
        self.route = route
        self.distance = 0
        self.fitness = 0.0

    def routeDistance(self):
        """Return the summed distance along the route, wrapping last -> first."""
        if self.distance != 0:
            # Already computed on an earlier call.
            return self.distance

        stops = len(self.route)
        total = 0
        for position, current in enumerate(self.route):
            # The successor of the final element is the first element.
            following = self.route[(position + 1) % stops]
            total += current.distance(following)
        self.distance = total
        return self.distance

    def routeFitness(self):
        """Return ``1 / routeDistance()`` as a float, caching the result."""
        if self.fitness != 0:
            return self.fitness
        self.fitness = 1 / float(self.routeDistance())
        return self.fitness

In [3]:
def createRoute(cityList):
    """Return a new list containing every element of ``cityList`` in random order."""
    # Sampling the full length yields a random permutation without touching the input.
    return random.sample(cityList, k=len(cityList))

In [4]:
def initialPopulation(popSize, cityList):
    """Build ``popSize`` independent random routes over ``cityList``."""
    return [createRoute(cityList) for _ in range(popSize)]

In [5]:
def rankRoutes(population):
    """Return ``(index, fitness)`` pairs for every route, highest fitness first.

    ``index`` is the route's position in ``population``.
    """
    scored = [
        (idx, Fitness(route).routeFitness())
        for idx, route in enumerate(population)
    ]
    scored.sort(key=operator.itemgetter(1), reverse=True)
    return scored

In [6]:
def selection(popRanked, eliteSize):
    """Pick the population indices that will form the mating pool.

    Parameters
    ----------
    popRanked : list of (index, fitness) pairs, best first (as produced by
        ``rankRoutes``).
    eliteSize : number of top-ranked entries carried over unconditionally.

    Returns
    -------
    list
        ``len(popRanked)`` indices: the first ``eliteSize`` ranked indices,
        followed by fitness-proportionate (roulette wheel) picks. An empty
        ranking yields an empty list.

    Raises
    ------
    IndexError
        If ``eliteSize`` exceeds ``len(popRanked)``.
    """
    if not popRanked:
        return []

    indices = [entry[0] for entry in popRanked]
    fitness = np.array([entry[1] for entry in popRanked], dtype=float)
    # Cumulative share of total fitness, in percent, in ranking order.
    cum_perc = (100 * np.cumsum(fitness) / fitness.sum()).tolist()

    # Elitism: the best routes always survive.
    selectionResults = [popRanked[rank][0] for rank in range(eliteSize)]

    last = len(popRanked) - 1
    for _ in range(len(popRanked) - eliteSize):
        pick = 100 * random.random()
        # First entry whose cumulative share covers the pick. If rounding (or a
        # NaN share) means none does, fall back to the last entry so the pool
        # never comes out smaller than the population.
        chosen = next(
            (pos for pos, threshold in enumerate(cum_perc) if pick <= threshold),
            last,
        )
        selectionResults.append(indices[chosen])
    return selectionResults

In [7]:
def matingPool(population, selectionResults):
    """Map each selected index back to its route in ``population``."""
    return [population[idx] for idx in selectionResults]

In [8]:
def breed(parent1, parent2):
    """Ordered crossover of two routes.

    A random contiguous slice of ``parent1`` becomes the head of the child;
    the remaining elements follow in the order they appear in ``parent2``.
    """
    size = len(parent1)
    cutA = int(random.random() * size)
    cutB = int(random.random() * size)
    lo, hi = (cutA, cutB) if cutA <= cutB else (cutB, cutA)

    # Genes inherited verbatim from the first parent (may be empty if lo == hi).
    inherited = [parent1[pos] for pos in range(lo, hi)]

    # Everything else, preserving the second parent's ordering.
    remainder = []
    for gene in parent2:
        if gene not in inherited:
            remainder.append(gene)

    return inherited + remainder

In [9]:
def breedPopulation(matingpool, eliteSize):
    """Produce the next set of routes from the mating pool.

    The first ``eliteSize`` entries of ``matingpool`` are copied over as-is;
    the rest are children bred from a shuffled copy of the pool, pairing the
    k-th entry with the k-th entry from the end.
    """
    poolSize = len(matingpool)
    shuffled = random.sample(matingpool, poolSize)

    offspring = [matingpool[k] for k in range(eliteSize)]
    offspring.extend(
        breed(shuffled[k], shuffled[poolSize - k - 1])
        for k in range(poolSize - eliteSize)
    )
    return offspring

In [10]:
def mutate(individual, mutationRate):
    """Swap-mutate ``individual`` in place and return it.

    Each position is, with probability ``mutationRate``, exchanged with a
    uniformly chosen position (possibly itself).
    """
    size = len(individual)
    for position in range(size):
        if random.random() >= mutationRate:
            continue
        partner = int(random.random() * size)
        individual[position], individual[partner] = (
            individual[partner],
            individual[position],
        )
    return individual

In [11]:
def mutatePopulation(population, mutationRate):
    """Apply ``mutate`` to every route and return them in a new list.

    The routes themselves are mutated in place by ``mutate``; only the outer
    list is new.
    """
    return [mutate(member, mutationRate) for member in population]

In [12]:
def nextGeneration(currentGen, eliteSize, mutationRate):
    """Advance the population by one generation: rank, select, breed, mutate."""
    ranked = rankRoutes(currentGen)
    chosen = selection(ranked, eliteSize)
    parents = matingPool(currentGen, chosen)
    offspring = breedPopulation(parents, eliteSize)
    return mutatePopulation(offspring, mutationRate)

In [29]:
def geneticAlgorithm(population, popSize, eliteSize, mutationRate, generations):
    """Run the genetic algorithm and return the best route of the final generation.

    Parameters
    ----------
    population : list of items to order; each random route is a permutation of it.
    popSize : number of routes kept per generation.
    eliteSize : number of top routes carried over unchanged each generation.
    mutationRate : per-position swap probability passed to ``mutate``.
    generations : number of generations to evolve.

    Prints the best distance before and after evolving, plus a progress line
    every 10 generations.
    """
    pop = initialPopulation(popSize, population)
    print("Initial distance: " + str(1 / rankRoutes(pop)[0][1]))

    for i in range(0, generations):
        if i % 10 == 0:
            print("-- iteration %d -- " % i)
        pop = nextGeneration(pop, eliteSize, mutationRate)

    # Rank the final population once and reuse the result for both the report
    # and the return value; ranking recomputes every route's fitness.
    bestRouteIndex, bestFitness = rankRoutes(pop)[0]
    print("Final distance: " + str(1 / bestFitness))
    return pop[bestRouteIndex]

In [14]:
import joblib as jb

def write_Slideshow_to_file(slideshow, output_name = "sexybaby.txt"):
    """Write ``slideshow`` to ``output_name`` as text.

    The first line is the number of slides; each following line holds one
    slide's id: a single value when the id has length 1, otherwise its first
    two values separated by a space.
    """
    with open(output_name, "w") as out:
        out.write("{}\n".format(len(slideshow.slides)))
        for slide in slideshow.slides:
            ids = slide.id
            if len(ids) != 1:
                line = "{} {}\n".format(ids[0], ids[1])
            else:
                line = "{}\n".format(ids[0])
            out.write(line)

def get_horizontals_from_collection(collection, groupby="average", filename=""):
    """Build slides from a photo collection and cache the results with joblib.

    Photos are split by orientation ("V" versus everything else), each group is
    sorted by tag count (most tags first), vertical photos are paired into
    two-photo slides and every other photo becomes a one-photo slide.

    Parameters
    ----------
    collection : iterable of photos exposing ``orientation`` and ``tags``.
    groupby : ``"2by2"`` pairs consecutive verticals (1st with 2nd, 3rd with
        4th, ...); any other value pairs the photo with the fewest tags with
        the one with the most, working inwards.
    filename : suffix used in the names of the joblib dump files.

    Returns
    -------
    (slides_fromVerticals, slides_fromHorizontals)

    With an odd number of vertical photos one photo is left without a partner:
    the last one (fewest tags) in ``"2by2"`` mode, the first one (most tags)
    otherwise.
    """
    # NOTE(review): this placeholder is never used below. It is kept because
    # constructing a Photo may have side effects (e.g. on an id counter) that
    # cannot be verified from this file - confirm and remove if it has none.
    null_photo = Photo(orientation="", tags=[])

    # Split the collection into vertical and non-vertical photos.
    collection_V = []
    collection_H = []
    for photo in collection:
        if photo.orientation == "V":
            collection_V.append(photo)
        else:
            collection_H.append(photo)

    # Sort each group in place by number of tags, largest first.
    collection_V.sort(key=lambda photo: len(photo.tags), reverse=True)
    collection_H.sort(key=lambda photo: len(photo.tags), reverse=True)

    # Generate the two-photo slides from the vertical photos.
    slides_fromVerticals = []
    if groupby == "2by2":
        # Stop before a trailing unpaired photo instead of indexing past the end.
        for index in range(0, len(collection_V) - 1, 2):
            slides_fromVerticals.append(Slide([collection_V[index], collection_V[index + 1]]))
    else:
        if len(collection_V) % 2 == 1:
            collection_V = collection_V[1:]
        # Measure the length after the optional drop so the mirrored index
        # below stays in range.
        m = len(collection_V)
        for i in range(m // 2):
            slides_fromVerticals.append(Slide([collection_V[m - 1 - i], collection_V[i]]))

    slides_fromHorizontals = [Slide([photo]) for photo in collection_H]

    # Persist intermediate results so they can be reloaded later.
    jb.dump(collection_V, "collection_V_{}.joblib".format(filename))
    jb.dump(collection_H, "collection_H_{}.joblib".format(filename))
    jb.dump(slides_fromVerticals, "slides_fromVerticals_{}_{}.joblib".format(groupby,filename))
    jb.dump(slides_fromHorizontals, "slides_fromHorizontals_{}.joblib".format(filename))
    return slides_fromVerticals, slides_fromHorizontals

def get_horizontals_from_file(filename, groupby="average"):
    """Reload the slide lists previously dumped for ``filename`` and ``groupby``.

    Returns ``(slides_fromVerticals, slides_fromHorizontals)``.
    """
    # joblib.load unpickles its input; only use it on files you produced yourself.
    vertical_path = "slides_fromVerticals_{}_{}.joblib".format(groupby, filename)
    horizontal_path = "slides_fromHorizontals_{}.joblib".format(filename)
    slides_fromVerticals = jb.load(vertical_path)
    slides_fromHorizontals = jb.load(horizontal_path)
    return slides_fromVerticals, slides_fromHorizontals

In [None]:
# Reset the class-level counter on Photo before reading a dataset.
# NOTE(review): presumably Photo uses id_counter to number photos as they are
# created - confirm in the `classes` module.
Photo.id_counter = 0

In [15]:
# Dataset c: read the photos and turn them into slides.
# NOTE(review): the alias `io` has the same name as the standard-library `io` module.
import input_output as io
photos = io.read("c_memorable_moments.txt")
# No `filename` is passed, so the joblib dumps written by
# get_horizontals_from_collection use the default empty suffix.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
# Two-photo slides first, then single-photo slides.
slides = slides_fromVerticals + slides_fromHorizontals

In [16]:
# Evolve an ordering of the dataset-c slides; `a` is the best route of the last generation.
# NOTE(review): the saved output below prints "N th distance" lines, which the
# geneticAlgorithm defined in this notebook does not emit, so that output comes
# from a different version of the function.
a = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=500) 

Initial distance: -166.0
0 th distance: -166.0
10 th distance: -183.0
20 th distance: -210.99999999999997
30 th distance: -216.0
40 th distance: -223.0
50 th distance: -226.99999999999997
60 th distance: -220.0
70 th distance: -220.99999999999997
80 th distance: -225.0
90 th distance: -222.0
100 th distance: -226.0
110 th distance: -230.0
120 th distance: -226.0
130 th distance: -229.0
140 th distance: -226.0
150 th distance: -226.99999999999997
160 th distance: -224.0
170 th distance: -236.0
180 th distance: -236.0
190 th distance: -233.0
200 th distance: -232.0
210 th distance: -229.0
220 th distance: -230.0
230 th distance: -220.0
240 th distance: -233.99999999999997
250 th distance: -226.99999999999997
260 th distance: -226.0
270 th distance: -237.00000000000003
280 th distance: -236.0
290 th distance: -225.0
300 th distance: -225.0
310 th distance: -232.0
320 th distance: -236.0
330 th distance: -226.99999999999997
340 th distance: -226.99999999999997
350 th distance: -228.0
360 t

In [17]:
# Display the best route returned for dataset c.
a

[id= (309,), tags= {'tz1', 'tbv', 'tpc1', 't2z1', 'tvs1', 'tjz', 'td22', 't221'},
 id= (676, 318), tags= {'t8l', 'tdn', 'tqk1', 'tft', 'tgg', 'td', 'tpr1', 't1', 'tbl', 'tmk', 't7j1', 't741', 'tm4', 't6d2', 'tt72', 't1g1', 't1z', 'tx42', 'th1'},
 id= (374,), tags= {'t492', 't3c1', 'tfz1', 't8l1', 'tm8', 't6'},
 id= (77,), tags= {'tr92', 't3n', 'tdb2', 't76', 'tz42', 't512', 'tr51'},
 id= (314,), tags= {'t2m1', 'tjl', 'tv81', 'tb32', 'tz91', 'tx62', 'tn42', 'ttb2', 't011', 'th1', 'tr2', 'tvk', 't7p1', 'tm'},
 id= (166,), tags= {'tk31', 't0j1', 't002', 'tkr1', 't052', 'tb12', 't3t', 't8c1', 't8j', 't39', 't2x1', 'td72'},
 id= (102, 805), tags= {'td41', 't3k', 't8t1', 't4d2', 't161', 'tmj1', 't002', 't9p1', 'tf3', 'th42', 'tss1', 't33', 'tn4', 't39', 't471', 'tr91', 'tm42', 't0l1', 't7n'},
 id= (11,), tags= {'t991', 't0t1', 'tp72', 'tnl', 'twn1', 'ttx1', 't4q1', 'tkn', 'th61', 't7n1', 'tkc2', 'tt'},
 id= (209,), tags= {'tl72', 'thg1', 't181', 'tmf', 'tvr', 'tt', 'tl51'},
 id= (720, 270), 

In [21]:
# Wrap the best route in a SlideShow.
# NOTE(review): the meaning of the second argument (None) is not visible in this notebook.
sh = SlideShow(a, None)

In [22]:
# Write the dataset-c slideshow to its output file.
write_Slideshow_to_file(sh, "output_c.txt")

In [30]:
# Reset the class-level counter on Photo before reading the next dataset.
# NOTE(review): presumably Photo uses id_counter to number photos as they are
# created - confirm in the `classes` module.
Photo.id_counter = 0

In [43]:
# Dataset b: read the photos and turn them into slides.
# This rebinds the globals `photos`, `slides_fromVerticals`,
# `slides_fromHorizontals` and `slides`.
import input_output as io
photos = io.read("b_lovely_landscapes.txt")
# No `filename` is passed, so the joblib dumps use the default empty suffix.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
slides = slides_fromVerticals + slides_fromHorizontals

In [44]:
# Evolve an ordering of the dataset-b slides.
# NOTE(review): the saved output below ends in KeyboardInterrupt during
# iteration 0, so `b_file` was not assigned by that run.
b_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 

Initial distance: -33.0
-- iteration 0 -- 


KeyboardInterrupt: 

In [None]:
# Wrap the dataset-b route in a SlideShow and write it out.
# Requires `b_file` from the preceding geneticAlgorithm cell.
sh_b = SlideShow(b_file, None)
write_Slideshow_to_file(sh_b, "output_b.txt")

In [None]:
# Reset the class-level counter on Photo before reading the next dataset.
# NOTE(review): presumably Photo uses id_counter to number photos as they are
# created - confirm in the `classes` module.
Photo.id_counter = 0

In [None]:
import input_output as io
# Dataset d: read photos, build slides, and evolve an ordering.
photos = io.read("d_pet_pictures.txt")
# No `filename` is passed, so the joblib dumps use the default empty suffix.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
slides = slides_fromVerticals + slides_fromHorizontals
# `d_file` is the best route of the final generation.
d_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 

In [None]:
# Wrap the dataset-d route in a SlideShow and write it out.
# Requires `d_file` from the preceding cell.
sh_d = SlideShow(d_file, None)
write_Slideshow_to_file(sh_d, "output_d.txt")

In [34]:
# Reset the class-level counter on Photo before reading the next dataset.
# NOTE(review): presumably Photo uses id_counter to number photos as they are
# created - confirm in the `classes` module.
Photo.id_counter = 0

In [None]:
# Dataset e: the full pipeline in one cell - read, build slides, evolve, write.
import input_output as io
photos = io.read("e_shiny_selfies.txt")
# No `filename` is passed, so the joblib dumps use the default empty suffix.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
slides = slides_fromVerticals + slides_fromHorizontals
# `e_file` is the best route of the final generation.
e_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 
sh_e = SlideShow(e_file, None)
write_Slideshow_to_file(sh_e, "output_e.txt")

In [None]:
# Reset the class-level counter on Photo before reading the next dataset.
# NOTE(review): presumably Photo uses id_counter to number photos as they are
# created - confirm in the `classes` module.
Photo.id_counter = 0

In [None]:
# Dataset a (the example file): the full pipeline in one cell - read, build
# slides, evolve, write.
import input_output as io
photos = io.read("a_example.txt")
# No `filename` is passed, so the joblib dumps use the default empty suffix.
slides_fromVerticals, slides_fromHorizontals = get_horizontals_from_collection(photos, groupby="average")
slides = slides_fromVerticals + slides_fromHorizontals
# `a_file` is the best route of the final generation.
a_file = geneticAlgorithm(population=slides, popSize=100, eliteSize=20, mutationRate=0.01, generations=200) 
sh_a = SlideShow(a_file, None)
write_Slideshow_to_file(sh_a, "output_a.txt")