In [1]:
%run -i ../../src/reload.py
import src
import config

In [25]:
import shutil
from tqdm import tqdm

In [7]:
# Read both dataset JSON files from config.dataset_dir in one pass;
# the generator's loop variable does not leak into the notebook namespace.
addrs_ds, tokens_ds = (
    src.utils.read_json(config.dataset_dir / dataset_file_name)
    for dataset_file_name in ('addrs.json', 'tokens.json')
)

In [12]:
# Root of the export cache; later cells copy files into its sub-directories.
ecd = config.export_cache_dir

# Parents are created before their children because these calls
# do not pass parents=True.
ecd.mkdir(exist_ok=True)
ecd.joinpath('accounts_metadata').mkdir(exist_ok=True)
ecd.joinpath('accounts_metadata', 'logos').mkdir(exist_ok=True)
ecd.joinpath('ipfs0').mkdir(exist_ok=True)
ecd.joinpath('previews').mkdir(exist_ok=True)
ecd.joinpath('previews', 'thumbs_256x256').mkdir(exist_ok=True)

# The transactions sub-directory reuses the name of config.transactions_dir;
# its intermediate 'transactions' directory is created via parents=True.
ecd.joinpath('transactions', config.transactions_dir.name).mkdir(parents=True, exist_ok=True)

In [None]:
# Copy account logos into the export cache.
print('Copying logos...')

for addr_ds_entry in tqdm(addrs_ds.values()):
    # Only entries with an empty ban_status are exported.
    if addr_ds_entry['ban_status'] == '':
        logo_file = config.tzktio_accounts_logos_dir / (addr_ds_entry['address'] + '.png')
        # Addresses without a logo file on disk are silently skipped.
        if logo_file.exists():
            shutil.copy(logo_file, ecd.joinpath('accounts_metadata', 'logos', logo_file.name))

In [33]:
# Copy 256x256 token thumbnails into the export cache.
print('Copying tokens 256x256 thumbs...')

for token_ds_entry in tqdm(tokens_ds.values()):
    # Only entries with an empty ban_status are exported.
    if token_ds_entry['ban_status'] == '':
        token_preview_file = config.previews_dir / 'thumbs_256x256' / (token_ds_entry['artifact_ipfs'] + '.jpeg')
        target_token_preview_file = ecd / 'previews' / 'thumbs_256x256' / token_preview_file.name
        # Nothing to do when the source thumbnail is missing or the
        # target was already copied by an earlier run.
        if not token_preview_file.exists() or target_token_preview_file.exists():
            continue
        shutil.copy(token_preview_file, target_token_preview_file)

  7%|█████████▋                                                                                                                                 | 1704/24567 [00:00<00:02, 8257.24it/s]

Copying tokens 256x256 thumbs...


100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24567/24567 [00:03<00:00, 6796.75it/s]


In [26]:
# Copy, for every token entry, the file named by its 'info_ipfs' field
# from config.ipfs0_dir into the export cache's 'ipfs0' directory.
print('Copying tokens metadata...')

for token_ds_entry in tqdm(tokens_ds.values()):
    token_ipfs0_file = config.ipfs0_dir / token_ds_entry['info_ipfs']
    # Guard on the file that is actually being copied. Testing a preview
    # path left over from another cell would either skip every entry or
    # let shutil.copy raise on the first missing metadata file, and would
    # fail with NameError on a fresh kernel.
    if token_ipfs0_file.exists():
        shutil.copy(token_ipfs0_file, ecd / 'ipfs0' / token_ipfs0_file.name)

  0%|                                                                                                                                                        | 0/24567 [00:00<?, ?it/s]

Copying tokens metadata...


100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24567/24567 [04:47<00:00, 85.41it/s]


In [28]:
# Copy the two standalone files into their export cache sub-directories.
print('Copying single files...')

# Accounts metadata file -> <export cache>/accounts_metadata/
shutil.copy(
    config.tzktio_accounts_metadata_file,
    ecd.joinpath('accounts_metadata', config.tzktio_accounts_metadata_file.name),
)

# Previews dimensions cache file -> <export cache>/previews/
# This call stays the cell's last expression so that its return value
# (the destination path) is displayed as the cell output.
shutil.copy(
    config.previews_dimensions_cache_file,
    ecd.joinpath('previews', config.previews_dimensions_cache_file.name),
)

Copying single files...


WindowsPath('D:/PycharmProjects/hicetnunc-dataset/export_cache/previews/dimensions.json')

In [29]:
# Copy transaction files into the export cache, keeping the name of
# their containing directory.
print('Copying transactions...')

for tr_file in tqdm(list(config.transactions_dir.iterdir())):
    # Files whose name contains 'invalid' are left out of the export.
    if 'invalid' not in tr_file.name:
        shutil.copy(tr_file, ecd.joinpath('transactions', tr_file.parent.name, tr_file.name))

2it [00:00, 15.63it/s]

Copying transactions...


35it [01:30,  2.58s/it]


In [32]:
import shutil

# Pack the whole export cache directory into a zip archive.
print('Making cache.zip archive...')

# make_archive appends the '.zip' extension itself, so pass the configured
# archive path with its suffix removed. Using `.stem` here would drop the
# parent directory and write the archive relative to the current working
# directory instead of at config.export_cache_archive_file.
shutil.make_archive(config.export_cache_archive_file.with_suffix(''), 'zip', ecd)

'D:\\PycharmProjects\\hicetnunc-dataset\\cache.zip.zip'

In [3]:
import shutil

# Pack the dataset directory into a zip archive.
print('Making dataset.zip archive...')

# base_name is the target archive path without its suffix; make_archive
# adds the format-specific extension and returns the archive's file name.
shutil.make_archive(
    base_name=config.export_dataset_archive_file.with_suffix(''),
    format='zip',
    root_dir=config.dataset_dir,
)

Making dataset.zip archive...


'D:\\PycharmProjects\\hicetnunc-dataset\\dataset.zip'

In [34]:
# 'hicetnunc' directory inside the website repository; the cells below
# copy into it only when it exists.
ewd = config.website_repo_dir.joinpath('hicetnunc')

In [35]:
# Copy account logos into the website directory, if that directory exists.
if ewd.is_dir():
    print('WEBSITE: Copying logos...')
    ewd.joinpath('user_logos').mkdir(exist_ok=True)

    for addr_ds_entry in tqdm(addrs_ds.values()):
        # Only entries with an empty ban_status are published.
        if addr_ds_entry['ban_status'] == '':
            logo_file = config.tzktio_accounts_logos_dir / (addr_ds_entry['address'] + '.png')
            target_logo_file = ewd / 'user_logos' / logo_file.name
            # Skip addresses without a logo and logos that were already copied.
            if not logo_file.exists() or target_logo_file.exists():
                continue
            shutil.copy(logo_file, target_logo_file)

  0%|                                                                                                                                                         | 0/4719 [00:00<?, ?it/s]

WEBSITE: Copying logos...


100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 4719/4719 [00:04<00:00, 1122.49it/s]


In [36]:
# Copy 256x256 token thumbnails into the website directory, if it exists.
if ewd.is_dir():
    print('WEBSITE: Copying tokens 256x256 thumbs...')
    ewd.joinpath('token_thumbs').mkdir(exist_ok=True)
    for token_ds_entry in tqdm(tokens_ds.values()):
        # Only entries with an empty ban_status are published.
        if token_ds_entry['ban_status'] == '':
            # The source file is named after 'artifact_ipfs', while the
            # website copy is named after 'token_id'.
            token_preview_file = config.previews_dir / 'thumbs_256x256' / (token_ds_entry['artifact_ipfs'] + '.jpeg')
            target_token_preview_file = ewd / 'token_thumbs' / (token_ds_entry['token_id'] + '.jpeg')
            # Skip missing source thumbnails and targets that already exist.
            if not token_preview_file.exists() or target_token_preview_file.exists():
                continue
            shutil.copy(token_preview_file, target_token_preview_file)

  0%|                                                                                                                                               | 10/24567 [00:00<04:06, 99.66it/s]

WEBSITE: Copying tokens 256x256 thumbs...


100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24567/24567 [04:52<00:00, 84.04it/s]
