In [None]:
# Mount Google Drive first: the dataset archives used by the following cell
# are read from paths under /content/drive.
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:
# Link to drive with images for reference
# https://drive.google.com/drive/folders/1WIZB_ZLItOE0XkjQg2FsLZIuoSnIcYQp
!apt-get install -y p7zip-full
DRIVE_ZIP_PATH_1 = '/content/drive/MyDrive/Colab Notebooks/RevealAI/48K First Sample/test.7z'
DRIVE_ZIP_PATH_2 = '/content/drive/MyDrive/Colab Notebooks/RevealAI/48K First Sample/train.7z'
DRIVE_ZIP_PATH_3 = '/content/drive/MyDrive/Colab Notebooks/RevealAI/48K First Sample/validation.7z'


# # Local temporary disk destination
LOCAL_DESTINATION = '/content/'

# # Execute the copy command

!cp "{DRIVE_ZIP_PATH_1}" "{LOCAL_DESTINATION}"
!cp "{DRIVE_ZIP_PATH_2}" "{LOCAL_DESTINATION}"
!cp "{DRIVE_ZIP_PATH_3}" "{LOCAL_DESTINATION}"

print(f" Copied data to local Colab disk.")
# # Path to the ZIP file on the local disk

LOCAL_ZIP_PATH_1 = '/content/test.7z'
LOCAL_ZIP_PATH_2 = '/content/train.7z'
LOCAL_ZIP_PATH_3 = '/content/validation.7z'

# # Execute the unzip command
# # -q: quiet (less terminal output)
# # -d /content/: extract contents to the /content/ directory

!7z x "{LOCAL_ZIP_PATH_1}" -o/content/
!7z x "{LOCAL_ZIP_PATH_2}" -o/content/
!7z x "{LOCAL_ZIP_PATH_3}" -o/content/
print(" Unzipping complete! Your data is now fast to access.")

Reading package lists... Done
Building dependency tree... Done
Reading state information... Done
p7zip-full is already the newest version (16.02+dfsg-8).
0 upgraded, 0 newly installed, 0 to remove and 41 not upgraded.
 Copied data to local Colab disk.

7-Zip [64] 16.02 : Copyright (c) 1999-2016 Igor Pavlov : 2016-05-21
p7zip Version 16.02 (locale=en_US.UTF-8,Utf16=on,HugeFiles=on,64 bits,2 CPUs Intel(R) Xeon(R) CPU @ 2.20GHz (406F0),ASM,AES-NI)

Scanning the drive for archives:
  0M Scan /content/                   1 file, 714238854 bytes (682 MiB)

Extracting archive: /content/test.7z
--
Path = /content/test.7z
Type = 7z
Physical Size = 714238854
Headers Size = 103910
Method = LZMA:23
Solid = +
Blocks = 1

  0%      0% - test/ai/000_biggan_00130.jpg                                     0% 50 - test/ai/054_biggan_00066.jpg             

In [None]:
# You have to get rid of the empty files or the model won't run
import os
from PIL import Image

folders = [
    "/content/train/ai",
    "/content/train/real",
    "/content/test/ai",
    "/content/test/real",
    "/content/validation/ai",
    "/content/validation/real"
]

# Walk every split/class folder, delete each zero-byte .jpg/.jpeg file and
# report how many files were removed.
count_removed = 0
for folder in folders:
    for filename in os.listdir(folder):
        file_path = os.path.join(folder, filename)
        is_jpeg_file = os.path.isfile(file_path) and filename.lower().endswith(('.jpg', '.jpeg'))
        if not is_jpeg_file:
            continue
        # Only files with no content at all are removed.
        if os.path.getsize(file_path) != 0:
            continue
        os.remove(file_path)
        count_removed += 1
print('Count of deleted files : ', count_removed)


In [None]:

folders = [
    "/content/train/ai",
    "/content/train/real",
    "/content/test/ai",
    "/content/test/real",
    "/content/validation/ai",
    "/content/validation/real"
]

# Colour composition of the AI images: each channel's share (in percent) of the
# summed R, G and B intensities over every pixel of every JPEG in the 'ai'
# folders.
ai = {'r': 0, 'g': 0, 'b': 0}

for folder in folders:
    # Match the class directory name exactly. A substring test ('ai' in folder)
    # also selects "/content/train/real", because "train" contains "ai", so
    # results produced before this fix mixed real training images into the AI
    # statistics.
    if os.path.basename(os.path.normpath(folder)) != 'ai':
        continue
    for f in os.listdir(folder):
        path = os.path.join(folder, f)
        if not (os.path.isfile(path) and f.lower().endswith(('.jpg', '.jpeg'))):
            continue
        try:
            # The context manager closes the file handle; convert() returns an
            # independent in-memory copy.
            with Image.open(path) as source:
                img = source.convert("RGB")
        except Exception as exc:
            # Skip images that cannot be decoded instead of continuing with
            # img = None, which would fail on the getcolors() call below.
            print(f"Skipping unreadable image {path}: {exc}")
            continue
        # maxcolors = pixel count, so getcolors() never overflows its limit.
        colors = img.getcolors(maxcolors=img.width * img.height)
        if colors is None:
            continue
        for count, (r, g, b) in colors:
            ai['r'] += r * count
            ai['g'] += g * count
            ai['b'] += b * count

total = sum(ai.values())
if total == 0:
    # No pixel data was accumulated, so the shares are undefined; keep the
    # zeros rather than dividing by zero.
    print("No pixel data found in the 'ai' folders; composition left at zero.")
else:
    ai = {channel: (value / total) * 100 for channel, value in ai.items()}
print('AI Folders color composition : ', ai)

AI Folders color composition :  {'r': 36.015429747312616, 'g': 33.88881971328638, 'b': 30.095750539401}


In [None]:

# Colour composition of the real images: each channel's share (in percent) of
# the summed R, G and B intensities over every pixel of every JPEG in the
# 'real' folders.
real = {'r': 0, 'g': 0, 'b': 0}

for folder in folders:
    # Match the class directory name exactly rather than by substring, so a
    # parent directory name can never select the wrong class.
    if os.path.basename(os.path.normpath(folder)) != 'real':
        continue
    for f in os.listdir(folder):
        path = os.path.join(folder, f)
        if not (os.path.isfile(path) and f.lower().endswith(('.jpg', '.jpeg'))):
            continue
        try:
            # The context manager closes the file handle; convert() returns an
            # independent in-memory copy.
            with Image.open(path) as source:
                img = source.convert("RGB")
        except Exception as exc:
            # Skip images that cannot be decoded instead of continuing with
            # img = None, which would fail on the getcolors() call below.
            print(f"Skipping unreadable image {path}: {exc}")
            continue
        # maxcolors = pixel count, so getcolors() never overflows its limit.
        colors = img.getcolors(maxcolors=img.width * img.height)
        if colors is None:
            continue
        for count, (r, g, b) in colors:
            real['r'] += r * count
            real['g'] += g * count
            real['b'] += b * count

total = sum(real.values())
if total == 0:
    # No pixel data was accumulated, so the shares are undefined; keep the
    # zeros rather than dividing by zero.
    print("No pixel data found in the 'real' folders; composition left at zero.")
else:
    real = {channel: (value / total) * 100 for channel, value in real.items()}
print('Real Folders color composition : ', real)


Real Folders color composition :  {'r': 35.79577421065303, 'g': 33.94757750335207, 'b': 30.256648285994896}


In [None]:


import numpy as np



# Brightness / contrast of the AI images: for every JPEG in the 'ai' folders,
# record the mean (brightness) and standard deviation (contrast) of its
# grayscale pixels, then print the averages over all images.
# The colour-composition dicts `ai` / `real` are deliberately not reset here,
# so the results computed by the earlier cells stay available.
data_brightness = []
data_contrast = []
for folder in folders:
    # Match the class directory name exactly. A substring test ('ai' in folder)
    # also selects "/content/train/real", because "train" contains "ai".
    if os.path.basename(os.path.normpath(folder)) != 'ai':
        continue
    for f in os.listdir(folder):
        path = os.path.join(folder, f)
        if not (os.path.isfile(path) and f.lower().endswith(('.jpg', '.jpeg'))):
            continue
        try:
            # Same RGB -> L conversion chain as before, done once per image;
            # the context manager closes the file handle.
            with Image.open(path) as source:
                gray_pixels = np.array(source.convert("RGB").convert('L'))
        except Exception as exc:
            # Skip images that cannot be decoded instead of continuing with
            # img = None, which would fail on the conversion.
            print(f"Skipping unreadable image {path}: {exc}")
            continue
        data_brightness.append(float(gray_pixels.mean()))
        data_contrast.append(float(gray_pixels.std()))
print(np.mean(data_brightness))
print(np.mean(data_contrast))




In [None]:


import numpy as np



# Brightness / contrast of the real images: for every JPEG in the 'real'
# folders, record the mean (brightness) and standard deviation (contrast) of
# its grayscale pixels, then print the averages over all images.
# The colour-composition dicts `ai` / `real` are deliberately not reset here,
# so the results computed by the earlier cells stay available.
data_brightness = []
data_contrast = []
for folder in folders:
    # Match the class directory name exactly rather than by substring, so a
    # parent directory name can never select the wrong class.
    if os.path.basename(os.path.normpath(folder)) != 'real':
        continue
    for f in os.listdir(folder):
        path = os.path.join(folder, f)
        if not (os.path.isfile(path) and f.lower().endswith(('.jpg', '.jpeg'))):
            continue
        try:
            # Same RGB -> L conversion chain as before, done once per image;
            # the context manager closes the file handle.
            with Image.open(path) as source:
                gray_pixels = np.array(source.convert("RGB").convert('L'))
        except Exception as exc:
            # Skip images that cannot be decoded instead of continuing with
            # img = None, which would fail on the conversion.
            print(f"Skipping unreadable image {path}: {exc}")
            continue
        data_brightness.append(float(gray_pixels.mean()))
        data_contrast.append(float(gray_pixels.std()))
print(np.mean(data_brightness))
print(np.mean(data_contrast))




117.13086237129887
57.50405576616695
