In [1]:
import os
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from PIL import Image

import torch
import torchvision
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
from torchvision import transforms, utils
import random
from torchvision.transforms import Resize, ToTensor, Normalize
from torch.utils.data import Dataset, DataLoader, random_split, SubsetRandomSampler, WeightedRandomSampler

In [2]:
def seed_everything(seed):
    """
    Fix the seed of every random number generator this notebook relies on,
    so that repeated runs under the same conditions give the same results.

    Args:
        seed: integer seed value
    """
    # Python's built-in RNG (the original author notes that transforms draw from it).
    random.seed(seed)
    # NumPy's global RNG.
    np.random.seed(seed)
    # PyTorch RNG, followed by the RNG of the current CUDA device.
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
    # torch.cuda.manual_seed_all(seed)  # if use multi-GPU
    # Pin the cuDNN flags: deterministic mode on, benchmark mode off.
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True

seed_everything(42)

In [None]:
# from zipfile import ZipFile

# file_name = "zipfiles/scenery.zip"

# with ZipFile(file_name, 'r') as zip:
#     zip.extractall("scenery") 
#     print('File is unzipped in vector folder')

In [3]:
def search(dirname, result):
    """
    Recursively collect the paths of all files under ``dirname``.

    Directories are descended into at the position where ``os.listdir``
    returns them; files whose name has no extension are skipped. A
    ``PermissionError`` stops the scan of the affected directory silently.

    Args:
        dirname: directory to scan
        result: list that the matching file paths are appended to (mutated in place)
    """
    try:
        for entry in os.listdir(dirname):
            entry_path = os.path.join(dirname, entry)
            if os.path.isdir(entry_path):
                search(entry_path, result)
                continue
            # Keep only entries that carry a file extension.
            _, extension = os.path.splitext(entry_path)
            if extension:
                result.append(entry_path)
    except PermissionError:
        pass

# Gather every image path from the two dataset folders.
scenery_all_path, vector_all_path = [], []
search("scenery", scenery_all_path)
search("vector", vector_all_path)

In [4]:
# Sanity check: how many file paths were collected for each folder.
len(scenery_all_path), len(vector_all_path)

(22125, 14876)

In [5]:
# Peek at the first few collected paths to confirm the filename pattern.
vector_all_path[:5]

['vector/moped-153275__340.png',
 'vector/cake-305217__340.png',
 'vector/bird-1296169__480.png',
 'vector/lady-2860835__340.png',
 'vector/bush-575517__340.png']

In [6]:
def labeling(dirname, result, prefix):
    """
    Append one text label per file under ``dirname`` to ``result``.

    The traversal mirrors ``search``: sub-directories are descended into at
    the position where ``os.listdir`` returns them, and entries without a
    file extension are skipped. This keeps the labels aligned one-to-one
    with the paths collected by ``search``, even when the folder contains
    stray directories (e.g. ``.ipynb_checkpoints``) or extensionless files.

    The keyword is the part of the file name before the first ".", before
    the first "__" and before the first "-".
    NOTE(review): multi-word names therefore keep only their first word
    ("tea-garden-..." -> "tea") -- confirm that this is intended.

    Args:
        dirname: directory to scan
        result: list that the labels are appended to (mutated in place)
        prefix: text placed in front of every keyword
    """
    try:
        filenames = os.listdir(dirname)
    except PermissionError:
        # Same best-effort behaviour as before: unreadable directories are skipped.
        return
    for filename in filenames:
        full_filename = os.path.join(dirname, filename)
        if os.path.isdir(full_filename):
            labeling(full_filename, result, prefix)
        elif os.path.splitext(full_filename)[-1]:
            keyword = filename.split(".")[0].split("__")[0].split("-")[0]
            result.append(prefix + keyword)

In [7]:
# Build one caption per file for each folder. The captions are later attached
# to the path lists by position, so both must come out in the same order.
dirname, vector_label = "vector", []
labeling(dirname, vector_label, "a vector image of ")
dirname, scenery_label = "scenery", []
labeling(dirname, scenery_label, "a scenery of ")

In [8]:
# Sanity check: the label counts should equal the path counts of the same folders.
len(vector_label), len(scenery_label)

(14876, 22125)

In [9]:
# Pair every scenery image path with its caption (matched by position).
scenery_df = pd.DataFrame(scenery_all_path, columns=['path']).assign(label=scenery_label)
scenery_df

Unnamed: 0,path,label
0,scenery/tea-garden-2823303__340.png,a scenery of tea
1,scenery/grain-field-6571349__340.png,a scenery of grain
2,scenery/santa-barbara-1584103__340.png,a scenery of santa
3,scenery/field-6772703__340.png,a scenery of field
4,scenery/cow-4960242__340.png,a scenery of cow
...,...,...
22120,scenery/tajikistan-4582152__340.png,a scenery of tajikistan
22121,scenery/river-6748978__340.png,a scenery of river
22122,scenery/mountains-5729187__340.png,a scenery of mountains
22123,scenery/spoon-bills-5791480__340.png,a scenery of spoon


In [10]:
# Pair every vector image path with its caption (matched by position).
vector_df = pd.DataFrame(vector_all_path, columns=['path']).assign(label=vector_label)
vector_df

Unnamed: 0,path,label
0,vector/moped-153275__340.png,a vector image of moped
1,vector/cake-305217__340.png,a vector image of cake
2,vector/bird-1296169__480.png,a vector image of bird
3,vector/lady-2860835__340.png,a vector image of lady
4,vector/bush-575517__340.png,a vector image of bush
...,...,...
14871,vector/sos-2753818__340.png,a vector image of sos
14872,vector/silhouette-1229849__340.png,a vector image of silhouette
14873,vector/dove-7100089__340.png,a vector image of dove
14874,vector/couple-2029712__340.png,a vector image of couple


In [11]:
# Stack both frames (vector rows first, then scenery) under a fresh 0..N-1 index.
df = pd.concat([vector_df, scenery_df], ignore_index=True)
df

Unnamed: 0,path,label
0,vector/moped-153275__340.png,a vector image of moped
1,vector/cake-305217__340.png,a vector image of cake
2,vector/bird-1296169__480.png,a vector image of bird
3,vector/lady-2860835__340.png,a vector image of lady
4,vector/bush-575517__340.png,a vector image of bush
...,...,...
36996,scenery/tajikistan-4582152__340.png,a scenery of tajikistan
36997,scenery/river-6748978__340.png,a scenery of river
36998,scenery/mountains-5729187__340.png,a scenery of mountains
36999,scenery/spoon-bills-5791480__340.png,a scenery of spoon


In [12]:
# Per-channel normalisation; these mean/std values are the standard ImageNet
# statistics used with torchvision's pretrained models.
normalize = transforms.Normalize(
    mean=[0.485, 0.456, 0.406],
    std=[0.229, 0.224, 0.225],
)

# Both splits use the same preprocessing: resize to 224x224, convert to a
# tensor, then normalise. Each split still gets its own Compose instance.
data_transforms = {
    split: transforms.Compose([
        transforms.Resize((224,224)),
        transforms.ToTensor(),
        normalize,
    ])
    for split in ('train', 'val')
}

In [13]:
class CustomDataset(Dataset):
    """
    Dataset that yields ``(image, label)`` pairs from a frame of image paths.

    Args:
        img_paths_label: object with a ``'path'`` and a ``'label'`` column
            (accessed positionally via ``.iloc``), e.g. a pandas DataFrame
        transform: callable applied to the loaded RGB image, or ``None`` to
            return the PIL image unchanged
    """

    def __init__(self, img_paths_label, transform):
        # Columns are read by position (.iloc), so the frame's index may be shuffled.
        self.X = img_paths_label['path']
        self.y = img_paths_label['label']
        self.transform = transform

    def __getitem__(self, index):
        """Load the image at position ``index`` as RGB and return it with its label."""
        # The context manager closes the underlying file handle right after
        # decoding; convert() returns an independent in-memory copy.
        with Image.open(self.X.iloc[index]) as raw_image:
            image = raw_image.convert('RGB')
        label = self.y.iloc[index]

        if self.transform is not None:
            image = self.transform(image)
        return image, label

    def __len__(self):
        """Number of samples in the dataset."""
        return len(self.X)

In [15]:
from sklearn.model_selection import train_test_split

# Hold out 20% of the rows for validation; the fixed random_state keeps the
# shuffled split reproducible.
train, valid = train_test_split(
    df,
    test_size=0.2,
    shuffle=True,
    random_state=42,
)

In [16]:
BATCH_SIZE = 32

# Training batches are reshuffled every epoch.
train_dataset = CustomDataset(train, data_transforms['train'])
train_dataloader = DataLoader(train_dataset,
                              batch_size=BATCH_SIZE,
                              shuffle=True)

# Validation keeps a fixed order so evaluation runs are reproducible and
# batches can be compared across epochs.
valid_dataset = CustomDataset(valid, data_transforms['val'])
valid_dataloader = DataLoader(valid_dataset,
                              batch_size=BATCH_SIZE,
                              shuffle=False)

In [18]:
# Draw one batch from a fresh iterator and show its image tensor
# (element 0 of the (image, label) pair produced by the dataset).
next(iter(train_dataloader))[0]

tensor([[[[-1.1418, -1.2959, -1.3302,  ..., -0.8678, -0.9705, -0.8164],
          [-0.9877, -1.1760, -1.2959,  ..., -0.9705, -1.1247, -1.0219],
          [-1.1247, -1.2103, -1.2445,  ..., -1.1075, -1.1932, -1.1075],
          ...,
          [-0.7650, -0.7650, -0.6965,  ...,  0.0398,  0.0398, -0.0458],
          [-0.6623, -0.6452, -0.6109,  ..., -0.0629, -0.0116,  0.0056],
          [-0.6109, -0.6109, -0.5938,  ..., -0.0458,  0.0227, -0.0287]],

         [[-0.7752, -0.9328, -0.9503,  ..., -0.5651, -0.6527, -0.5126],
          [-0.6352, -0.8102, -0.9153,  ..., -0.6527, -0.7927, -0.6877],
          [-0.7402, -0.8277, -0.8452,  ..., -0.7577, -0.8452, -0.7752],
          ...,
          [-0.9153, -0.9153, -0.8803,  ..., -0.4776, -0.4776, -0.5476],
          [-0.8627, -0.8452, -0.8277,  ..., -0.5826, -0.5301, -0.5126],
          [-0.8102, -0.8102, -0.8102,  ..., -0.5651, -0.4951, -0.5476]],

         [[-0.0790, -0.2184, -0.2184,  ..., -0.5321, -0.6541, -0.5147],
          [ 0.0256, -0.1487, -

In [19]:
# Shape of one image batch drawn from a fresh iterator.
next(iter(train_dataloader))[0].shape

torch.Size([32, 3, 224, 224])

* 간혹 `PIL.UnidentifiedImageError: cannot identify image file` 에러가 발생함 (손상되었거나 이미지가 아닌 파일을 읽을 때).

In [20]:
import importlib

def get_obj_from_str(string, reload=False):
    """
    Resolve a dotted path such as ``"package.module.Name"`` to the object it names.

    Args:
        string: dotted import path; the part after the last dot is the attribute name
        reload: when true, the module is reloaded before the attribute is looked up

    Returns:
        The attribute found on the imported module.
    """
    module_name, attr_name = string.rsplit(".", 1)
    target_module = importlib.import_module(module_name, package=None)
    if reload:
        # reload() hands back the module object that now lives in sys.modules.
        target_module = importlib.reload(target_module)
    return getattr(target_module, attr_name)

def instantiate_from_config(config):
    """
    Build the object described by ``config``.

    Args:
        config: mapping with a ``"target"`` dotted path and optional ``"params"``
            keyword arguments, or one of the sentinel strings
            ``'__is_first_stage__'`` / ``"__is_unconditional__"``

    Returns:
        The instantiated target, or ``None`` for the sentinel strings.

    Raises:
        KeyError: if ``config`` has no ``"target"`` and is not a sentinel.
    """
    if "target" in config:
        factory = get_obj_from_str(config["target"])
        kwargs = config.get("params", dict())
        return factory(**kwargs)
    if config == '__is_first_stage__' or config == "__is_unconditional__":
        return None
    raise KeyError("Expected key `target` to instantiate.")

def load_model_from_config(config, ckpt):
    """
    Instantiate the model described by ``config.model`` and load its weights.

    Args:
        config: configuration object exposing a ``model`` entry accepted by
            ``instantiate_from_config``
        ckpt: path to a checkpoint file containing a ``"state_dict"`` entry

    Returns:
        The model, moved to the GPU and switched to eval mode.
    """
    print(f"Loading model from {ckpt}")
    # NOTE(security): torch.load unpickles the file -- only load trusted checkpoints.
    # Deserialise onto the CPU first, so loading does not depend on the device
    # the checkpoint was saved from; the weights reach the GPU via model.cuda().
    pl_sd = torch.load(ckpt, map_location="cpu")
    sd = pl_sd["state_dict"]
    model = instantiate_from_config(config.model)
    # strict=False tolerates key mismatches, so report them instead of
    # discarding them silently.
    missing, unexpected = model.load_state_dict(sd, strict=False)
    if len(missing) > 0:
        print(f"missing keys: {len(missing)}")
    if len(unexpected) > 0:
        print(f"unexpected keys: {len(unexpected)}")
    model.cuda()
    model.eval()
    return model

In [21]:
from omegaconf import OmegaConf

def get_model(config_path="../configs/latent-diffusion/txt2img-1p4B-eval.yaml",
              ckpt_path="../models/ldm/text2img-large/model.ckpt"):
    """
    Load the model from a config file and a checkpoint.

    Args:
        config_path: path of the YAML config read with ``OmegaConf.load``
        ckpt_path: path of the checkpoint passed to ``load_model_from_config``

    Returns:
        The model returned by ``load_model_from_config``.
    """
    # TODO: Optionally download from same location as ckpt and change this logic
    config = OmegaConf.load(config_path)
    # TODO: check path
    model = load_model_from_config(config, ckpt_path)
    return model

In [None]:
# !pip install pytorch_lightning

In [22]:
# Show the module search path used by this kernel.
import sys
sys.path

['/opt/ml/latent-diffusion/scripts',
 '/opt/conda/envs/ldm/lib/python38.zip',
 '/opt/conda/envs/ldm/lib/python3.8',
 '/opt/conda/envs/ldm/lib/python3.8/lib-dynload',
 '',
 '/opt/conda/envs/ldm/lib/python3.8/site-packages',
 '/opt/ml/latent-diffusion/src/taming-transformers',
 '/opt/ml/latent-diffusion',
 '/opt/ml/latent-diffusion/src/clip']

In [None]:
# sys.path.append('/opt/ml/latent-diffusion')

In [None]:
# sys.path

['/opt/ml/latent-diffusion/scripts',
 '/opt/conda/lib/python38.zip',
 '/opt/conda/lib/python3.8',
 '/opt/conda/lib/python3.8/lib-dynload',
 '',
 '/opt/conda/lib/python3.8/site-packages',
 '/opt/conda/lib/python3.8/site-packages/IPython/extensions',
 '/opt/ml/.ipython',
 '/opt/ml/latent-diffusion']

In [23]:
# Build the model and load its checkpoint weights (see the log output below).
model = get_model()

Loading model from ../models/ldm/text2img-large/model.ckpt
LatentDiffusion: Running in eps-prediction mode
DiffusionWrapper has 872.30 M params.
making attention of type 'vanilla' with 512 in_channels
Working with z of shape (1, 4, 32, 32) = 4096 dimensions.
making attention of type 'vanilla' with 512 in_channels
