Initial commit.

HackerPoet · Aug 5, 2018 · a23c70b · a23c70b
commit a23c70b
Show file tree

Hide file tree

Showing 6 changed files with 484 additions and 0 deletions.
diff --git a/cpu.theanorc b/cpu.theanorc
@@ -0,0 +1,3 @@
+[global]
+floatX=float32
+device=cpu
diff --git a/datagen.py b/datagen.py
@@ -0,0 +1,71 @@
+import os, random, sys
+import numpy as np
+import cv2
+from dutil import *
+
+NUM_IMAGES = 1769
+SAMPLES_PER_IMG = 10
+DOTS_PER_IMG = 60
+IMAGE_W = 144
+IMAGE_H = 192
+IMAGE_DIR = 'YB_PICTURES'
+NUM_SAMPLES = NUM_IMAGES * 2 * SAMPLES_PER_IMG
+
+def center_resize(img):
+	assert(IMAGE_W == IMAGE_H)
+	w, h = img.shape[0], img.shape[1]
+	if w > h:
+		x = (w-h)/2
+		img = img[x:x+h,:]
+	elif h > w:
+		img = img[:,0:w]
+	return cv2.resize(img, (IMAGE_W, IMAGE_H), interpolation = cv2.INTER_LINEAR)
+
+def yb_resize(img):
+	assert(img.shape[1] == 151)
+	assert(img.shape[0] == 197)
+	return cv2.resize(img, (IMAGE_W, IMAGE_H), interpolation = cv2.INTER_LINEAR)
+
+def rand_dots(img, sample_ix):
+	sample_ratio = float(sample_ix) / SAMPLES_PER_IMG
+	return auto_canny(img, sample_ratio)
+
+x_data = np.empty((NUM_SAMPLES, NUM_CHANNELS, IMAGE_H, IMAGE_W), dtype=np.uint8)
+y_data = np.empty((NUM_SAMPLES, 3, IMAGE_H, IMAGE_W), dtype=np.uint8)
+ix = 0
+for root, subdirs, files in os.walk(IMAGE_DIR):
+	for file in files:
+		path = root + "\\" + file
+		if not (path.endswith('.jpg') or path.endswith('.png')):
+			continue
+		img = cv2.imread(path)
+		if img is None:
+			assert(False)
+		if len(img.shape) != 3 or img.shape[2] != 3:
+			assert(False)
+		if img.shape[0] < IMAGE_H or img.shape[1] < IMAGE_W:
+			assert(False)
+		img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
+		img = yb_resize(img)
+		for i in xrange(SAMPLES_PER_IMG):
+			y_data[ix] = np.transpose(img, (2, 0, 1))
+			x_data[ix] = rand_dots(img, i)
+			if ix < SAMPLES_PER_IMG*16:
+				outimg = x_data[ix][0]
+				cv2.imwrite('cargb' + str(ix) + '.png', outimg)
+				print path
+			ix += 1
+			y_data[ix] = np.flip(y_data[ix - 1], axis=2)
+			x_data[ix] = np.flip(x_data[ix - 1], axis=2)
+			ix += 1
+
+		sys.stdout.write('\r')
+		progress = ix * 100 / NUM_SAMPLES
+		sys.stdout.write(str(progress) + "%")
+		sys.stdout.flush()
+		assert(ix <= NUM_SAMPLES)
+
+assert(ix == NUM_SAMPLES)
+print "Saving..."
+np.save('x_data.npy', x_data)
+np.save('y_data.npy', y_data)
diff --git a/dutil.py b/dutil.py
@@ -0,0 +1,27 @@
+import numpy as np
+import cv2
+
+def add_pos(arr):
+	s = arr.shape
+	result = np.empty((s[0], s[1] + 2, s[2], s[3]), dtype=np.float32)
+	result[:,:s[1],:,:] = arr
+	x = np.repeat(np.expand_dims(np.arange(s[3]) / float(s[3]), axis=0), s[2], axis=0)
+	y = np.repeat(np.expand_dims(np.arange(s[2]) / float(s[2]), axis=0), s[3], axis=0)
+	result[:,s[1] + 0,:,:] = x
+	result[:,s[1] + 1,:,:] = np.transpose(y)
+	return result
+
+def auto_canny(image, sigma=0.0):
+	gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
+	grayed = np.where(gray < 20, 255, 0)
+
+	lower = sigma*128 + 128
+	upper = 255
+	edged = cv2.Canny(image, lower, upper)
+
+	return np.maximum(edged, grayed)
+
+def save_image(x, fname):
+	img = np.transpose(x * 255, (1, 2, 0))
+	img = cv2.cvtColor(img.astype(np.uint8), cv2.COLOR_RGB2BGR)
+	cv2.imwrite(fname, img)
diff --git a/encoder.py b/encoder.py
@@ -0,0 +1,182 @@
+import sys, random
+import numpy as np
+from matplotlib import pyplot as plt
+from dutil import *
+import pydot
+
+SHIFT_AMOUNT = 9
+BATCH_SIZE = 8
+NUM_KERNELS = 20
+CONTINUE_TRAIN = False
+
+NUM_EPOCHS = 2000
+PARAM_SIZE = 80
+LR = 0.001
+NUM_RAND_FACES = BATCH_SIZE
+NUM_TEST_FACES = BATCH_SIZE
+
+def plotScores(scores, test_scores, fname, on_top=True):
+	plt.clf()
+	ax = plt.gca()
+	ax.yaxis.tick_right()
+	ax.yaxis.set_ticks_position('both')
+	ax.yaxis.grid(True)
+	plt.plot(scores)
+	plt.plot(test_scores)
+	plt.xlabel('Epoch')
+	plt.ylim([0.0, 0.01])
+	loc = ('upper right' if on_top else 'lower right')
+	plt.legend(['Train', 'Test'], loc=loc)
+	plt.draw()
+	plt.savefig(fname)
+
+#Load data set
+print "Loading Data..."
+y_train = np.load('y_data.npy').astype(np.float32) / 255.0
+y_train = y_train[:y_train.shape[0] - y_train.shape[0] % BATCH_SIZE]
+x_train = np.expand_dims(np.arange(y_train.shape[0]), axis=1)
+num_samples = y_train.shape[0]
+print "Loaded " + str(num_samples) + " Samples."
+
+###################################
+#  Create Model
+###################################
+print "Loading Keras..."
+import os, math
+os.environ['THEANORC'] = "./gpu.theanorc"
+os.environ['KERAS_BACKEND'] = "theano"
+import theano
+print "Theano Version: " + theano.__version__
+
+from keras.initializers import RandomUniform
+from keras.layers import Input, Dense, Activation, Dropout, Flatten, Reshape, SpatialDropout2D
+from keras.layers.convolutional import Conv2D, Conv2DTranspose, UpSampling2D
+from keras.layers.embeddings import Embedding
+from keras.layers.local import LocallyConnected2D
+from keras.layers.pooling import MaxPooling2D
+from keras.layers.noise import GaussianNoise
+from keras.models import Model, Sequential, load_model
+from keras.optimizers import Adam, RMSprop, SGD
+from keras.preprocessing.image import ImageDataGenerator
+from keras.regularizers import l1
+from keras.utils import plot_model
+from keras import backend as K
+from custom_layers import BinaryEncoder, PATCON
+K.set_image_data_format('channels_first')
+
+if CONTINUE_TRAIN:
+	print "Loading Model..."
+	model = load_model('Encoder.h5')
+else:
+	print "Building Model..."
+	model = Sequential()
+
+	model.add(Embedding(num_samples, PARAM_SIZE, input_length=1))
+	model.add(Flatten(name='pre_encoder'))
+	print model.output_shape
+	assert(model.output_shape == (None, PARAM_SIZE))
+
+	model.add(Reshape((PARAM_SIZE, 1, 1), name='encoder'))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(256, (4, 1)))           #(4, 1)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(256, 4))                #(7, 4)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(256, 4))                #(10, 7)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(256, 4, strides=2))     #(22, 16)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(128, 4, strides=2))     #(46, 34)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(128, 4, strides=2))     #(94, 70)
+	model.add(Activation("relu"))
+	print model.output_shape
+
+	model.add(Conv2DTranspose(3, 6, strides=2))      #(192, 144)
+	model.add(Activation("sigmoid"))
+	print model.output_shape
+	assert(model.output_shape[1:] == (3, 192, 144))
+
+	model.compile(optimizer=Adam(lr=LR), loss='mse')
+	plot_model(model, to_file='model.png', show_shapes=True)
+
+###################################
+#  Encoder / Decoder
+###################################
+print "Compiling SubModels..."
+func = K.function([model.get_layer('encoder').input, K.learning_phase()],
+				  [model.layers[-1].output])
+enc_model = Model(inputs=model.input,
+                  outputs=model.get_layer('pre_encoder').output)
+
+rand_vecs = np.random.normal(0.0, 1.0, (NUM_RAND_FACES, PARAM_SIZE))
+
+def make_rand_faces(rand_vecs, iters):
+	x_enc = enc_model.predict(x_train, batch_size=BATCH_SIZE)
+
+	x_mean = np.mean(x_enc, axis=0)
+	x_stds = np.std(x_enc, axis=0)
+	x_cov = np.cov((x_enc - x_mean).T)
+	e, v = np.linalg.eig(x_cov)
+
+	np.save('means.npy', x_mean)
+	np.save('stds.npy', x_stds)
+	np.save('evals.npy', e)
+	np.save('evecs.npy', v)
+
+	e_list = e.tolist()
+	e_list.sort(reverse=True)
+	plt.clf()
+	plt.bar(np.arange(e.shape[0]), e_list, align='center')
+	plt.draw()
+	plt.savefig('evals.png')
+
+	x_vecs = x_mean + np.dot(v, (rand_vecs * e).T).T
+	y_faces = func([x_vecs, 0])[0]
+	for i in xrange(y_faces.shape[0]):
+		save_image(y_faces[i], 'rand' + str(i) + '.png')
+		if i < 5 and (iters % 10) == 0:
+			if not os.path.exists('morph' + str(i)):
+				os.makedirs('morph' + str(i))
+			save_image(y_faces[i], 'morph' + str(i) + '/img' + str(iters) + '.png')
+
+make_rand_faces(rand_vecs, 0)
+
+###################################
+#  Train
+###################################
+print "Training..."
+train_loss = []
+
+for iters in xrange(NUM_EPOCHS):
+	history = model.fit(x_train, y_train, batch_size=BATCH_SIZE, epochs=1)
+
+	loss = history.history['loss'][-1]
+	train_loss.append(loss)
+	print "Loss: " + str(loss)
+
+	plotScores(train_loss, [], 'EncoderScores.png', True)
+
+	if iters % 20 == 0:
+		model.save('Encoder.h5')
+
+		y_faces = model.predict(x_train[:NUM_TEST_FACES], batch_size=BATCH_SIZE)
+		for i in xrange(y_faces.shape[0]):
+			save_image(y_faces[i], 'gt' + str(i) + '.png')
+
+		make_rand_faces(rand_vecs, iters)
+
+		print "Saved"
+
+print "Done"