In [None]:
# Attach Google Drive to the Colab VM so the dataset under MyDrive is readable
# through the normal filesystem API.
from google.colab import drive

DRIVE_MOUNT_POINT = '/content/drive'
drive.mount(DRIVE_MOUNT_POINT)

Mounted at /content/drive


In [None]:
from pycocotools.coco import COCO # Common Object in Context
import numpy as np
import cv2
import os
from tqdm import tqdm

# ---------------------------------------------------------------------------
# Build one binary foreground mask (0 = background, 255 = any annotated
# object) per image from the COCO instance annotations and save it as PNG.
# ---------------------------------------------------------------------------

# base path
base_path = r'/content/drive/MyDrive/AI_Vision_Extract_Nov25/data/COCO2017_SAMPLE'

# Create output directory with FULL PATH
masks_output_dir = os.path.join(base_path, 'mask_val2017')
os.makedirs(masks_output_dir, exist_ok=True)

print(f"Saving masks to: {masks_output_dir}")

# Load val annotations.
# The *instances* file is required here: captions_*.json carries no
# 'segmentation' field, so coco.annToMask() raises KeyError('segmentation')
# for every annotation. The annotations directory is a sibling of base_path,
# so it is spelled out explicitly rather than joined onto base_path.
# NOTE(review): assumes instances_val2017.json sits in this directory --
# adjust the file name if a different split is intended.
annotations_dir = r'/content/drive/MyDrive/AI_Vision_Extract_Nov25/data/annotations'
annotations_path = os.path.join(annotations_dir, 'instances_val2017.json')
if not os.path.isfile(annotations_path):
    raise FileNotFoundError(f"COCO instance annotations not found: {annotations_path}")

coco = COCO(annotations_path)
img_ids = coco.getImgIds()

print(f"Total val images: {len(img_ids)}")

# Only the first few failures are printed in full; the rest are counted so a
# systematic problem does not flood the cell output with one line per image.
MAX_LOGGED_ERRORS = 20
failed_img_ids = []
saved_count = 0

# Create masks for val images
for img_id in tqdm(img_ids, desc='Creating val masks'):
    try:
        img_info = coco.loadImgs(img_id)[0]
        ann_ids = coco.getAnnIds(imgIds=img_id)
        anns = coco.loadAnns(ann_ids)

        # Create binary mask
        mask = np.zeros((img_info['height'], img_info['width']), dtype=np.uint8)

        for ann in anns:
            # Union of the per-annotation masks. np.maximum avoids the uint8
            # wrap-around that repeated `+=` can hit on overlapping objects.
            np.maximum(mask, coco.annToMask(ann), out=mask)

        # Binary conversion (0 or 255)
        mask = (mask > 0).astype(np.uint8) * 255

        # Save with matching filename using ABSOLUTE PATH.
        # splitext keeps this correct for any image extension, not just '.jpg'.
        stem, _ = os.path.splitext(img_info['file_name'])
        mask_filename = f"{stem}_mask.png"
        mask_path = os.path.join(masks_output_dir, mask_filename)

        # cv2.imwrite reports failure through its return value, not an exception.
        if not cv2.imwrite(mask_path, mask):
            raise IOError(f"cv2.imwrite could not write {mask_path}")
        saved_count += 1
    except Exception as e:
        # Best effort: keep going on per-image failures, but remember them so
        # the summary below reflects what actually happened.
        failed_img_ids.append(img_id)
        if len(failed_img_ids) <= MAX_LOGGED_ERRORS:
            # tqdm.write prints without corrupting the progress bar.
            tqdm.write(f"Error processing image {img_id}: {type(e).__name__}: {e}")
        elif len(failed_img_ids) == MAX_LOGGED_ERRORS + 1:
            tqdm.write("Further per-image errors suppressed; see summary below.")

# Report the real outcome instead of an unconditional success message.
if failed_img_ids:
    print(f"✗ {len(failed_img_ids)} of {len(img_ids)} images failed; {saved_count} masks written.")
else:
    print("✓ Val masks created successfully!")

# Verify masks were created
mask_count = len([f for f in os.listdir(masks_output_dir) if f.endswith('_mask.png')])
print(f"✓ Verified: {mask_count} mask files created in {masks_output_dir}")


Saving masks to: /content/drive/MyDrive/AI_Vision_Extract_Nov25/data/COCO2017_SAMPLE/mask_val2017
loading annotations into memory...
Done (t=3.89s)
creating index...
index created!
Total val images: 118287


Creating val masks:   4%|▍         | 4840/118287 [00:00<00:02, 48393.47it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 187177: 'segmentation'
Error processing image 403349: 'segmentation'
Error processing image 124873: 'segmentation'
Error processing image 468162: 'segmentation'
Error processing image 34892: 'segmentation'
Error processing image 544071: 'segmentation'
Error processing image 12966: 'segmentation'
Error processing image 357356: 'segmentation'
Error processing image 142940: 'segmentation'
Error processing image 548331: 'segmentation'
Error processing image 462241: 'segmentation'
Error processing image 442565: 'segmentation'
Error processing image 78838: 'segmentation'
Error processing image 91474: 'segmentation'
Error processing image 200720: 'segmentation'
Error processing image 430652: 'segmentation'
Error processing image 569070: 'segmentation'
Error processing image 344314: 'segmentation'
Error processing image 243331: 'segmentation'
Error processing image 440895: 'segmentation'
Error processing im

Creating val masks:  12%|█▏        | 14050/118287 [00:00<00:02, 42853.47it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 426101: 'segmentation'
Error processing image 328818: 'segmentation'
Error processing image 16164: 'segmentation'
Error processing image 154363: 'segmentation'
Error processing image 443281: 'segmentation'
Error processing image 464176: 'segmentation'
Error processing image 470348: 'segmentation'
Error processing image 66879: 'segmentation'
Error processing image 390583: 'segmentation'
Error processing image 418854: 'segmentation'
Error processing image 30254: 'segmentation'
Error processing image 104751: 'segmentation'
Error processing image 185633: 'segmentation'
Error processing image 159151: 'segmentation'
Error processing image 482297: 'segmentation'
Error processing image 476313: 'segmentation'
Error processing image 345401: 'segmentation'
Error processing image 141197: 'segmentation'
Error processing image 235964: 'segmentation'
Error processing image 271206: 'segmentation'
Error processing i

Creating val masks:  19%|█▉        | 22750/118287 [00:00<00:02, 43113.14it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 364911: 'segmentation'
Error processing image 558388: 'segmentation'
Error processing image 69757: 'segmentation'
Error processing image 76431: 'segmentation'
Error processing image 382288: 'segmentation'
Error processing image 105011: 'segmentation'
Error processing image 208817: 'segmentation'
Error processing image 468337: 'segmentation'
Error processing image 124416: 'segmentation'
Error processing image 238980: 'segmentation'
Error processing image 92776: 'segmentation'
Error processing image 574250: 'segmentation'
Error processing image 128756: 'segmentation'
Error processing image 246686: 'segmentation'
Error processing image 305962: 'segmentation'
Error processing image 403975: 'segmentation'
Error processing image 60213: 'segmentation'
Error processing image 235319: 'segmentation'
Error processing image 287636: 'segmentation'
Error processing image 75434: 'segmentation'
Error processing ima

Creating val masks:  27%|██▋       | 31365/118287 [00:00<00:02, 42761.39it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 556341: 'segmentation'
Error processing image 502163: 'segmentation'
Error processing image 320396: 'segmentation'
Error processing image 190950: 'segmentation'
Error processing image 416193: 'segmentation'
Error processing image 315577: 'segmentation'
Error processing image 546792: 'segmentation'
Error processing image 65430: 'segmentation'
Error processing image 109907: 'segmentation'
Error processing image 482021: 'segmentation'
Error processing image 252008: 'segmentation'
Error processing image 161144: 'segmentation'
Error processing image 230585: 'segmentation'
Error processing image 565903: 'segmentation'
Error processing image 424392: 'segmentation'
Error processing image 48268: 'segmentation'
Error processing image 324338: 'segmentation'
Error processing image 442536: 'segmentation'
Error processing image 576045: 'segmentation'
Error processing image 539453: 'segmentation'
Error processing 

Creating val masks:  34%|███▍      | 40133/118287 [00:00<00:01, 41843.10it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 62246: 'segmentation'
Error processing image 41434: 'segmentation'
Error processing image 263515: 'segmentation'
Error processing image 552646: 'segmentation'
Error processing image 130324: 'segmentation'
Error processing image 309983: 'segmentation'
Error processing image 220860: 'segmentation'
Error processing image 113216: 'segmentation'
Error processing image 315728: 'segmentation'
Error processing image 249451: 'segmentation'
Error processing image 482195: 'segmentation'
Error processing image 271195: 'segmentation'
Error processing image 470975: 'segmentation'
Error processing image 74403: 'segmentation'
Error processing image 382979: 'segmentation'
Error processing image 216072: 'segmentation'
Error processing image 521570: 'segmentation'
Error processing image 159309: 'segmentation'
Error processing image 558129: 'segmentation'
Error processing image 362131: 'segmentation'
Error processing i

Creating val masks:  41%|████      | 48455/118287 [00:01<00:01, 40856.65it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 65900: 'segmentation'
Error processing image 210612: 'segmentation'
Error processing image 73035: 'segmentation'
Error processing image 150773: 'segmentation'
Error processing image 456345: 'segmentation'
Error processing image 44954: 'segmentation'
Error processing image 227941: 'segmentation'
Error processing image 579260: 'segmentation'
Error processing image 236938: 'segmentation'
Error processing image 52281: 'segmentation'
Error processing image 295740: 'segmentation'
Error processing image 456800: 'segmentation'
Error processing image 26310: 'segmentation'
Error processing image 264436: 'segmentation'
Error processing image 68242: 'segmentation'
Error processing image 479621: 'segmentation'
Error processing image 538581: 'segmentation'
Error processing image 462353: 'segmentation'
Error processing image 466305: 'segmentation'
Error processing image 341121: 'segmentation'
Error processing imag

Creating val masks:  48%|████▊     | 56833/118287 [00:01<00:01, 39605.54it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 531459: 'segmentation'
Error processing image 547637: 'segmentation'
Error processing image 237762: 'segmentation'
Error processing image 244428: 'segmentation'
Error processing image 199619: 'segmentation'
Error processing image 411750: 'segmentation'
Error processing image 415222: 'segmentation'
Error processing image 306722: 'segmentation'
Error processing image 418985: 'segmentation'
Error processing image 268122: 'segmentation'
Error processing image 510596: 'segmentation'
Error processing image 88287: 'segmentation'
Error processing image 463285: 'segmentation'
Error processing image 160837: 'segmentation'
Error processing image 217925: 'segmentation'
Error processing image 175038: 'segmentation'
Error processing image 381330: 'segmentation'
Error processing image 165654: 'segmentation'
Error processing image 264320: 'segmentation'
Error processing image 133517: 'segmentation'
Error processing

Creating val masks:  55%|█████▍    | 64841/118287 [00:01<00:01, 39153.19it/s]

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Error processing image 529238: 'segmentation'
Error processing image 203040: 'segmentation'
Error processing image 109561: 'segmentation'
Error processing image 292921: 'segmentation'
Error processing image 86294: 'segmentation'
Error processing image 476761: 'segmentation'
Error processing image 536509: 'segmentation'
Error processing image 344361: 'segmentation'
Error processing image 252608: 'segmentation'
Error processing image 455198: 'segmentation'
Error processing image 2754: 'segmentation'
Error processing image 450672: 'segmentation'
Error processing image 380171: 'segmentation'
Error processing image 229603: 'segmentation'
Error processing image 169360: 'segmentation'
Error processing image 488244: 'segmentation'
Error processing image 544035: 'segmentation'
Error processing image 316649: 'segmentation'
Error processing image 439946: 'segmentation'
Error processing image 561527: 'segmentation'
Error processing i

Creating val masks:  62%|██████▏   | 73016/118287 [00:01<00:01, 38931.74it/s]

Error processing image 281745: 'segmentation'
Error processing image 449350: 'segmentation'
Error processing image 510977: 'segmentation'
Error processing image 574839: 'segmentation'
Error processing image 142413: 'segmentation'
Error processing image 241945: 'segmentation'
Error processing image 63248: 'segmentation'
Error processing image 105293: 'segmentation'
Error processing image 49554: 'segmentation'
Error processing image 536103: 'segmentation'
Error processing image 502911: 'segmentation'
Error processing image 221474: 'segmentation'
Error processing image 108217: 'segmentation'
Error processing image 397527: 'segmentation'
Error processing image 239350: 'segmentation'
Error processing image 381922: 'segmentation'
Error processing image 553640: 'segmentation'
Error processing image 229654: 'segmentation'
Error processing image 25377: 'segmentation'
Error processing image 432119: 'segmentation'
Error processing image 471596: 'segmentation'
Error processing image 376153: 'segme

Creating val masks:  69%|██████▉   | 81519/118287 [00:02<00:00, 40223.83it/s]

Error processing image 103510: 'segmentation'
Error processing image 302278: 'segmentation'
Error processing image 515512: 'segmentation'
Error processing image 19250: 'segmentation'
Error processing image 304332: 'segmentation'
Error processing image 327468: 'segmentation'
Error processing image 245230: 'segmentation'
Error processing image 57491: 'segmentation'
Error processing image 509654: 'segmentation'
Error processing image 409754: 'segmentation'
Error processing image 550140: 'segmentation'
Error processing image 336497: 'segmentation'
Error processing image 510571: 'segmentation'
Error processing image 578497: 'segmentation'
Error processing image 259551: 'segmentation'
Error processing image 107052: 'segmentation'
Error processing image 130816: 'segmentation'
Error processing image 310317: 'segmentation'
Error processing image 269958: 'segmentation'
Error processing image 36187: 'segmentation'
Error processing image 203545: 'segmentation'
Error processing image 40474: 'segmen

Creating val masks:  76%|███████▌  | 89438/118287 [00:02<00:00, 38267.13it/s]

Error processing image 47526: 'segmentation'
Error processing image 460448: 'segmentation'
Error processing image 550745: 'segmentation'
Error processing image 579968: 'segmentation'
Error processing image 164224: 'segmentation'
Error processing image 130625: 'segmentation'
Error processing image 23588: 'segmentation'
Error processing image 496386: 'segmentation'
Error processing image 88663: 'segmentation'
Error processing image 520610: 'segmentation'
Error processing image 246470: 'segmentation'
Error processing image 228732: 'segmentation'
Error processing image 236626: 'segmentation'
Error processing image 545145: 'segmentation'
Error processing image 177289: 'segmentation'
Error processing image 95241: 'segmentation'
Error processing image 290676: 'segmentation'
Error processing image 297898: 'segmentation'
Error processing image 369202: 'segmentation'
Error processing image 580523: 'segmentation'
Error processing image 358172: 'segmentation'
Error processing image 278204: 'segmen

Creating val masks:  79%|███████▉  | 93285/118287 [00:02<00:00, 37025.14it/s]

Error processing image 175357: 'segmentation'
Error processing image 345104: 'segmentation'
Error processing image 232434: 'segmentation'
Error processing image 533835: 'segmentation'
Error processing image 73189: 'segmentation'
Error processing image 69432: 'segmentation'
Error processing image 340699: 'segmentation'
Error processing image 197661: 'segmentation'
Error processing image 14375: 'segmentation'
Error processing image 407698: 'segmentation'
Error processing image 174735: 'segmentation'
Error processing image 84211: 'segmentation'
Error processing image 295505: 'segmentation'
Error processing image 422336: 'segmentation'
Error processing image 216322: 'segmentation'
Error processing image 460737: 'segmentation'
Error processing image 293174: 'segmentation'
Error processing image 427163: 'segmentation'
Error processing image 320643: 'segmentation'
Error processing image 156739: 'segmentation'
Error processing image 468241: 'segmentation'
Error processing image 23249: 'segment

Creating val masks:  85%|████████▍ | 100491/118287 [00:02<00:00, 34455.54it/s]

Error processing image 432892: 'segmentation'
Error processing image 335174: 'segmentation'
Error processing image 172827: 'segmentation'
Error processing image 127229: 'segmentation'
Error processing image 233877: 'segmentation'
Error processing image 208250: 'segmentation'
Error processing image 530364: 'segmentation'
Error processing image 208880: 'segmentation'
Error processing image 467206: 'segmentation'
Error processing image 110704: 'segmentation'
Error processing image 200611: 'segmentation'
Error processing image 198323: 'segmentation'
Error processing image 387895: 'segmentation'
Error processing image 507952: 'segmentation'
Error processing image 238654: 'segmentation'
Error processing image 141236: 'segmentation'
Error processing image 52448: 'segmentation'
Error processing image 380455: 'segmentation'
Error processing image 494986: 'segmentation'
Error processing image 506232: 'segmentation'
Error processing image 571366: 'segmentation'
Error processing image 212401: 'seg

Creating val masks:  91%|█████████ | 107622/118287 [00:02<00:00, 35061.13it/s]

Error processing image 432908: 'segmentation'
Error processing image 87214: 'segmentation'
Error processing image 556643: 'segmentation'
Error processing image 191945: 'segmentation'
Error processing image 528621: 'segmentation'
Error processing image 411751: 'segmentation'
Error processing image 205011: 'segmentation'
Error processing image 444086: 'segmentation'
Error processing image 275211: 'segmentation'
Error processing image 196290: 'segmentation'
Error processing image 173324: 'segmentation'
Error processing image 395304: 'segmentation'
Error processing image 525212: 'segmentation'
Error processing image 173893: 'segmentation'
Error processing image 156512: 'segmentation'
Error processing image 580600: 'segmentation'
Error processing image 96713: 'segmentation'
Error processing image 117360: 'segmentation'
Error processing image 146926: 'segmentation'
Error processing image 541531: 'segmentation'
Error processing image 8186: 'segmentation'
Error processing image 111425: 'segmen

Creating val masks:  97%|█████████▋| 114777/118287 [00:02<00:00, 35178.59it/s]

Error processing image 150797: 'segmentation'
Error processing image 471132: 'segmentation'
Error processing image 172543: 'segmentation'
Error processing image 412566: 'segmentation'
Error processing image 143958: 'segmentation'
Error processing image 88267: 'segmentation'
Error processing image 298350: 'segmentation'
Error processing image 95633: 'segmentation'
Error processing image 313494: 'segmentation'
Error processing image 556363: 'segmentation'
Error processing image 306902: 'segmentation'
Error processing image 436984: 'segmentation'
Error processing image 555583: 'segmentation'
Error processing image 287117: 'segmentation'
Error processing image 145452: 'segmentation'
Error processing image 13800: 'segmentation'
Error processing image 208857: 'segmentation'
Error processing image 123208: 'segmentation'
Error processing image 27920: 'segmentation'
Error processing image 132422: 'segmentation'
Error processing image 289140: 'segmentation'
Error processing image 252905: 'segmen

Creating val masks: 100%|██████████| 118287/118287 [00:03<00:00, 38482.75it/s]

Error processing image 565201: 'segmentation'
Error processing image 121792: 'segmentation'
Error processing image 370728: 'segmentation'
Error processing image 556599: 'segmentation'
Error processing image 168296: 'segmentation'
Error processing image 545257: 'segmentation'
Error processing image 250909: 'segmentation'
Error processing image 120230: 'segmentation'
Error processing image 250958: 'segmentation'
Error processing image 88870: 'segmentation'
Error processing image 45230: 'segmentation'
Error processing image 284448: 'segmentation'
Error processing image 288683: 'segmentation'
Error processing image 186155: 'segmentation'
Error processing image 359360: 'segmentation'
Error processing image 130069: 'segmentation'
Error processing image 580434: 'segmentation'
Error processing image 404750: 'segmentation'
Error processing image 131127: 'segmentation'
Error processing image 467645: 'segmentation'
Error processing image 124132: 'segmentation'
Error processing image 142208: 'segm




In [None]:
# Check if masks exist
# Only files following this notebook's '<image stem>_mask.png' naming are
# counted, and the list is sorted because os.listdir() returns entries in
# arbitrary order (the "first 5" preview would otherwise vary between runs).
mask_files = sorted(
    f for f in os.listdir(masks_output_dir) if f.endswith('_mask.png')
)
print(f"Number of masks created: {len(mask_files)}")
print(f"First 5 mask files: {mask_files[:5]}")

# Check file sizes
total_size = sum(os.path.getsize(os.path.join(masks_output_dir, f)) for f in mask_files)
print(f"Total disk space used: {total_size / (1024**3):.2f} GB")

if not mask_files:
    # Make an empty result impossible to overlook.
    print(f"WARNING: no mask files found in {masks_output_dir} -- check the mask-generation cell output.")

Number of masks created: 0
First 5 mask files: []
Total disk space used: 0.00 GB
