## Load captions

You can get 5 captions for each of the 1200 images included in the ImageNetTraining dataset.

In [13]:
import numpy as np
import pandas as pd

# Caption table; this notebook uses its "image_id" and "caption" columns.
df = pd.read_csv("data/ImageNetTraining_captions.csv")

# Load image id list (1200 images)
# np.unique already returns its result sorted, so no extra sorted() is needed.
# .tolist() converts the NumPy string scalars to built-in str, so the printed
# list shows plain quoted ids regardless of the installed NumPy version.
image_id_list = np.unique(df["image_id"].tolist()).tolist()
print("Image id list")
print(image_id_list)

# Read category id list (150 categories)
# An image id looks like "<category id>_<number>"; keep the part before "_".
category_id_list = np.unique(
    [image_id.split("_")[0] for image_id in image_id_list]
).tolist()
print("Category id list")
print(category_id_list)

Image id list
['n01518878_10042', 'n01518878_12028', 'n01518878_14075', 'n01518878_14910', 'n01518878_5958', 'n01518878_7346', 'n01518878_7579', 'n01518878_8432', 'n01639765_22407', 'n01639765_32862', 'n01639765_37122', 'n01639765_40261', 'n01639765_44823', 'n01639765_47681', 'n01639765_48759', 'n01639765_52902', 'n01645776_10130', 'n01645776_10758', 'n01645776_8522', 'n01645776_8879', 'n01645776_9361', 'n01645776_9576', 'n01645776_9693', 'n01645776_9743', 'n01664990_10648', 'n01664990_13731', 'n01664990_16740', 'n01664990_18293', 'n01664990_19129', 'n01664990_19923', 'n01664990_65', 'n01664990_7133', 'n01704323_10031', 'n01704323_10239', 'n01704323_10394', 'n01704323_5092', 'n01704323_8008', 'n01704323_8767', 'n01704323_9172', 'n01704323_9812', 'n01726692_18809', 'n01726692_21053', 'n01726692_30357', 'n01726692_31558', 'n01726692_8404', 'n01726692_8752', 'n01726692_8975', 'n01726692_9090', 'n01768244_10258', 'n01768244_11944', 'n01768244_6450', 'n01768244_7012', 'n01768244_7788', 'n01

In [14]:
# Load captions (6000 captions in total; only the first 3 images are shown here)
for image_id in image_id_list[:3]:
    print(image_id)
    # 5 captions for each image.
    # Select rows with a boolean mask rather than a string-formatted query, so
    # the id is compared as a value and never parsed as part of an expression
    # (an id containing a quote character would break the formatted query).
    captions = df.loc[df["image_id"] == image_id, "caption"].values
    print(captions)


n01518878_10042
['A brown and tan ostridge walking near a metal building,'
 'Brown feathered ostrich with white head and neck facing to the left, standing near a metal or aluminum type fencing.'
 'An ostrich with ruffled feathers looks in the direction of a green building.'
 'A brown ostrich is looking the direction of a green wall.'
 'a ostrich standing near a fence and looking at something']
n01518878_12028
['The head of an ostridge looking over a metal fence.'
 'An emu or ostrich with an un-amused expression is looking in the direction of the camera.'
 'An ostrich with fuzzy hair on its head looks over a wire fence.'
 'A serious looking ostrich peers out over a wire fence.'
 'A close up image of a disappointed looking ostrich.']
n01518878_14075
['A brown ostridge with its beak open walking in a field of dead grass.'
 'A large bird holds its beak open and stands in some brown grass.'
 'An ostrich with its beak open walks through long, dry grasses.'
 'An ostrich standing in the middle

## Load category information

ImageNetTraining image stimuli were obtained from [ImageNet](https://www.image-net.org/), whose ImageNet IDs are derived from [WordNet](https://wordnet.princeton.edu/) synsets.
You can read the corresponding WordNet synonyms for the 150 categories included in ImageNetTraining. (If you would like to access more detailed information, please use the `nltk` library.)

In [15]:
# Category table; this cell uses its "synset" and "synonym" columns.
df_cat = pd.read_csv("data/ImageNetTraining_category.csv")

for category_id in category_id_list[:3]:  # only 3
    print(category_id)
    # Match the synset id with a boolean mask instead of a string-formatted
    # query, so the id is compared as a value rather than spliced into an
    # expression. Only the first matching row is used; .values[0] raises
    # IndexError if the category id is absent from the table.
    synonyms = df_cat.loc[df_cat["synset"] == category_id, "synonym"].values[0]
    print(synonyms)

n01518878
ostrich
n01639765
frog
n01645776
true toad
