## Setup Docker container for DB and install lib

In [None]:
!pip install -qU langchain_postgres
# run postgres pg_vector docker with command: docker compose up


## Setup Postgres pg_vector Vector Store and function for importing documents

In [1]:
import os
from app.db.VectorStore import VectorStore
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_core.documents import Document
from tqdm import tqdm
from bs4 import BeautifulSoup
from app.db.EnumDocsCollection import EnumDocsCollection

def purify_HTML(html: str)->str:
    soup = BeautifulSoup(html, features="html.parser")

    for script in soup(["script", "style"]):
        script.extract()    # rip it out

    text = soup.get_text()

    lines = (line.strip() for line in text.splitlines())
    chunks = (phrase.strip() for line in lines for phrase in line.split("  "))
    text = '\n'.join(chunk for chunk in chunks if chunk)
    return text


def import_source_documents(folder: str):
    # Split documents and store in vector db
    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=10000,
        chunk_overlap=200
    )

    vectordb = VectorStore.get_vector_store(folder)
    dir = os.path.join("../data/", folder)
    for root, d_names, f_names in os.walk(dir):
        progress_bar = tqdm(f_names)
        for file in progress_bar:
            progress_bar.set_description(file)
            if not os.path.isdir(file):
                with open(os.path.join(root, file)) as f:
                    splits = []
                    if file.endswith(".png") or file.endswith(".jpg") or file.endswith(".jpeg"):
                        continue
                    try:
                        text = f.read()
                        if file.endswith(".html"):
                            text = purify_HTML(text)
                    except Exception as e:
                        print(e)

                    for idx, chunk in enumerate(text_splitter.split_text(text)):
                        splits.append(Document(
                            page_content=chunk,
                            metadata={"source": file, "chunk_idx": idx}
                        ))
                    try:
                        vectordb.add_documents(splits)
                    except Exception as e:
                        print(e)

## Load Base Information

In [2]:
vectordb = VectorStore.get_vector_store(EnumDocsCollection.BASE_INFO.value)
vectordb.drop_tables()

2024-12-31 15:48:21.045 
  command:

    streamlit run /home/michal/anaconda3/lib/python3.12/site-packages/ipykernel_launcher.py [ARGUMENTS]


Fetching 5 files:   0%|          | 0/5 [00:00<?, ?it/s]

In [3]:
import_source_documents(EnumDocsCollection.BASE_INFO.value)

Fetching 5 files:   0%|          | 0/5 [00:00<?, ?it/s]

companyhouseWiki.txt: 100%|██████████| 2/2 [00:00<00:00,  2.58it/s]         


## Load Companyhouse Project Code

In [None]:
import_source_documents(EnumDocsCollection.COMPANYHOUSE_PROJ_CODE.value)

Fetching 5 files:   0%|          | 0/5 [00:00<?, ?it/s]

init: 100%|██████████| 4/4 [00:01<00:00,  2.40it/s]         
gulpfile.js: 100%|██████████| 4/4 [00:00<00:00,  6.30it/s]    
contact.js:  10%|█         | 4/40 [00:01<00:10,  3.30it/s]               

(psycopg.errors.NotNullViolation) null value in column "id" of relation "langchain_pg_embedding" violates not-null constraint
DETAIL:  Failing row contains (null, null, null, null, null).
[SQL: INSERT INTO langchain_pg_embedding DEFAULT VALUES ON CONFLICT (id) DO UPDATE SET embedding = excluded.embedding, document = excluded.document, cmetadata = excluded.cmetadata]
(Background on this error at: https://sqlalche.me/e/20/gkpj)


overlay.js:  32%|███▎      | 13/40 [00:03<00:05,  4.54it/s]            

## Load Framework Documentation

In [None]:
import_source_documents(EnumDocsCollection.FRAMEWORK_DOCS.value)

Fetching 5 files:   0%|          | 0/5 [00:00<?, ?it/s]

yii-apidoc-models-methoddoc.html:  42%|████▏     | 362/858 [07:42<09:49,  1.19s/it]                            

## Load Companyhouse Documentation

In [10]:
import_source_documents(EnumDocsCollection.COMPANYHOUSE_PROJ_DOCS.value)

Fetching 5 files:   0%|          | 0/5 [00:00<?, ?it/s]

Sitemaps_2239660052.html: 100%|██████████| 122/122 [00:29<00:00,  4.17it/s]                                                               
0it [00:00, ?it/s]
bullet_blue.gif:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x91 in position 10: invalid start byte


grey_arrow_down.png:  67%|██████▋   | 2/3 [00:00<00:00,  4.76it/s]

'utf-8' codec can't decode byte 0xc4 in position 10: invalid continuation byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


grey_arrow_down.png: 100%|██████████| 3/3 [00:00<00:00,  4.90it/s]
wink.png:  33%|███▎      | 1/3 [00:00<00:00,  6.06it/s] 

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


smile.png: 100%|██████████| 3/3 [00:00<00:00,  5.98it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1f60e.png:   0%|          | 0/18 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2757.png:  11%|█         | 2/18 [00:00<00:02,  5.50it/s] 

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2705.png:  22%|██▏       | 4/18 [00:00<00:02,  5.71it/s] 

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2699.png:  33%|███▎      | 6/18 [00:01<00:02,  5.92it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1f4cb.png:  44%|████▍     | 8/18 [00:01<00:01,  6.02it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


274c.png:  56%|█████▌    | 10/18 [00:01<00:01,  5.92it/s] 

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1f4b5.png:  67%|██████▋   | 12/18 [00:02<00:00,  6.21it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1f935-200d-2642-fe0f.png:  72%|███████▏  | 13/18 [00:02<00:00,  6.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1f4c4.png:  83%|████████▎ | 15/18 [00:02<00:00,  5.71it/s]               

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1fa99.png:  94%|█████████▍| 17/18 [00:02<00:00,  5.67it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1fa99.png: 100%|██████████| 18/18 [00:03<00:00,  5.80it/s]
home_page_16.png: 100%|██████████| 1/1 [00:00<00:00,  5.29it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


0it [00:00, ?it/s]
2178842659.sh: 100%|██████████| 2/2 [00:00<00:00, 10.41it/s]
2097381380.mp4:  33%|███▎      | 2/6 [00:00<00:00, 13.41it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2098200583.png:  67%|██████▋   | 4/6 [00:01<00:00,  2.17it/s]

'utf-8' codec can't decode byte 0xeb in position 41: invalid continuation byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2098200583.png: 100%|██████████| 6/6 [00:01<00:00,  3.44it/s]
1842151433.png:   6%|▌         | 2/36 [00:00<00:02, 16.08it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1740439592:  17%|█▋        | 6/36 [00:00<00:01, 15.50it/s]    

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1839300633.png:  28%|██▊       | 10/36 [00:00<00:01, 14.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0xd3 in position 6: invalid continuation byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1836122231.png:  39%|███▉      | 14/36 [00:00<00:01, 14.54it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1740538048:  44%|████▍     | 16/36 [00:01<00:01, 11.70it/s]    

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1838219289.png:  50%|█████     | 18/36 [00:01<00:01,  9.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1841528841.png:  56%|█████▌    | 20/36 [00:01<00:01,  9.12it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1839300641.png:  61%|██████    | 22/36 [00:01<00:01,  9.56it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1827799065.png:  72%|███████▏  | 26/36 [00:02<00:00, 10.00it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1830682727.png:  78%|███████▊  | 28/36 [00:02<00:00,  9.98it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1836122217.png:  89%|████████▉ | 32/36 [00:02<00:00,  9.88it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1842151425.png:  94%|█████████▍| 34/36 [00:03<00:00,  9.61it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1842151425.png: 100%|██████████| 36/36 [00:03<00:00, 10.92it/s]
2130214955.png: 100%|██████████| 1/1 [00:00<00:00,  9.11it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2100002828.png:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2100101129.png:  20%|██        | 1/5 [00:00<00:00,  7.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2100068357.png:  20%|██        | 1/5 [00:00<00:00,  7.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2100002839.png:  60%|██████    | 3/5 [00:00<00:00,  8.86it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2100002839.png: 100%|██████████| 5/5 [00:00<00:00, 10.02it/s]
2254471208.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2254471208.png: 100%|██████████| 1/1 [00:00<00:00, 11.39it/s]
2081816595.pdf: 100%|██████████| 1/1 [00:00<00:00, 10.33it/s]


'utf-8' codec can't decode byte 0xc7 in position 10: invalid continuation byte


2146697217.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2146697217.png: 100%|██████████| 1/1 [00:00<00:00, 13.74it/s]
2265743371.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2268233740.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2268430347.png:  33%|███▎      | 2/6 [00:00<00:00, 14.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2268266503.png:  33%|███▎      | 2/6 [00:00<00:00, 14.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2265546777.png:  67%|██████▋   | 4/6 [00:00<00:00, 14.03it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2265612307.png:  67%|██████▋   | 4/6 [00:00<00:00, 14.03it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2265612307.png: 100%|██████████| 6/6 [00:00<00:00, 13.01it/s]
2166685710.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166816773.png:  17%|█▋        | 1/6 [00:00<00:00,  8.90it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166652958.png:  33%|███▎      | 2/6 [00:00<00:00,  8.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166718479.png:  50%|█████     | 3/6 [00:00<00:00,  7.79it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166849545.png:  67%|██████▋   | 4/6 [00:00<00:00,  8.03it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166784009.png:  67%|██████▋   | 4/6 [00:00<00:00,  8.03it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2166784009.png: 100%|██████████| 6/6 [00:00<00:00,  8.31it/s]
2141126690.pdf:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xe2 in position 11: invalid continuation byte


2141126690.pdf: 100%|██████████| 1/1 [00:00<00:00,  6.22it/s]
2076737588:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076737582: 100%|██████████| 2/2 [00:00<00:00, 10.50it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


1712586841.jpg:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1712586812.jpg:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1712554068.jpg:  33%|███▎      | 2/6 [00:00<00:00, 13.05it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1712586824.jpg:  33%|███▎      | 2/6 [00:00<00:00, 13.05it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1712586835.jpg:  67%|██████▋   | 4/6 [00:00<00:00, 13.14it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1713307679.jpg:  67%|██████▋   | 4/6 [00:00<00:00, 13.14it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1713307679.jpg: 100%|██████████| 6/6 [00:00<00:00, 13.00it/s]
2173042698.png:   0%|          | 0/10 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172846083.png:   0%|          | 0/10 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172878853.png:  20%|██        | 2/10 [00:00<00:00, 12.66it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172977168.png:  20%|██        | 2/10 [00:00<00:00, 12.66it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172878859.png:  40%|████      | 4/10 [00:00<00:00, 12.85it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172846095.png:  40%|████      | 4/10 [00:00<00:00, 12.85it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172977155.png:  60%|██████    | 6/10 [00:00<00:00, 12.68it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172977161.png:  60%|██████    | 6/10 [00:00<00:00, 12.68it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2172846101.png:  80%|████████  | 8/10 [00:00<00:00, 13.17it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2173009929.png:  80%|████████  | 8/10 [00:00<00:00, 13.17it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2173009929.png: 100%|██████████| 10/10 [00:00<00:00, 12.91it/s]
2232844306:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2232844318:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2232844300:  40%|████      | 2/5 [00:00<00:00, 12.44it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2232844294:  40%|████      | 2/5 [00:00<00:00, 12.44it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2232844312:  80%|████████  | 4/5 [00:00<00:00, 13.00it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2232844312: 100%|██████████| 5/5 [00:00<00:00, 12.85it/s]
2201845808.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2201845808.png: 100%|██████████| 1/1 [00:00<00:00, 12.14it/s]
2431025200.png:   0%|          | 0/14 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025167.png:   0%|          | 0/14 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025176.png:  14%|█▍        | 2/14 [00:00<00:00, 12.64it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025191.png:  14%|█▍        | 2/14 [00:00<00:00, 12.64it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025203.png:  29%|██▊       | 4/14 [00:00<00:00, 13.42it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025206.png:  29%|██▊       | 4/14 [00:00<00:00, 13.42it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025173.png:  43%|████▎     | 6/14 [00:00<00:00, 12.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025194.png:  43%|████▎     | 6/14 [00:00<00:00, 12.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025197.png:  57%|█████▋    | 8/14 [00:00<00:00, 12.43it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025185.png:  57%|█████▋    | 8/14 [00:00<00:00, 12.43it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025170.png:  71%|███████▏  | 10/14 [00:00<00:00, 12.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025182.png:  71%|███████▏  | 10/14 [00:00<00:00, 12.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025188.png:  86%|████████▌ | 12/14 [00:00<00:00, 12.32it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025179.png:  86%|████████▌ | 12/14 [00:01<00:00, 12.32it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431025179.png: 100%|██████████| 14/14 [00:01<00:00, 12.54it/s]
2442559516.png:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2442559522.png:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2442035244.png:  50%|█████     | 2/4 [00:00<00:00, 11.38it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441969704.png:  50%|█████     | 2/4 [00:00<00:00, 11.38it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441969704.png: 100%|██████████| 4/4 [00:00<00:00, 10.62it/s]
2183823367.png:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183856136.png:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183823378.png:  40%|████      | 2/5 [00:00<00:00, 12.27it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183790604.png:  40%|████      | 2/5 [00:00<00:00, 12.27it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183790614.png:  80%|████████  | 4/5 [00:00<00:00, 13.50it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183790614.png: 100%|██████████| 5/5 [00:00<00:00, 13.47it/s]
2178777112.png:  17%|█▋        | 1/6 [00:00<00:00,  8.18it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178809901.png:  33%|███▎      | 2/6 [00:00<00:00,  7.60it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178744437.mnu: 100%|██████████| 6/6 [00:00<00:00,  6.15it/s]
2183364614.png:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183397402.png:  25%|██▌       | 1/4 [00:00<00:00,  3.78it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183430156.png:  50%|█████     | 2/4 [00:00<00:00,  4.34it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2183364644.png: 100%|██████████| 4/4 [00:00<00:00,  4.45it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2071232550.jpg:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2071363603.jpg:  25%|██▌       | 1/4 [00:00<00:00,  4.64it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2278850568.png:  75%|███████▌  | 3/4 [00:00<00:00,  4.49it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2278850568.png: 100%|██████████| 4/4 [00:00<00:00,  4.24it/s]
2320662548.png:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320695306.png:  25%|██▌       | 1/4 [00:00<00:00,  4.70it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320760858.png:  50%|█████     | 2/4 [00:00<00:00,  4.72it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320990238.png:  75%|███████▌  | 3/4 [00:00<00:00,  4.01it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320990238.png: 100%|██████████| 4/4 [00:01<00:00,  3.97it/s]
2360377375.png:   0%|          | 0/23 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359164942.png:   4%|▍         | 1/23 [00:00<00:05,  4.30it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359001125.png:   9%|▊         | 2/23 [00:00<00:05,  4.06it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358837300.png:  13%|█▎        | 3/23 [00:00<00:04,  4.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359001144.png:  17%|█▋        | 4/23 [00:00<00:04,  4.08it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358968358.png:  22%|██▏       | 5/23 [00:01<00:04,  4.31it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359033885.png:  26%|██▌       | 6/23 [00:01<00:04,  3.94it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358706212.png:  30%|███       | 7/23 [00:01<00:04,  3.99it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358804520.png:  35%|███▍      | 8/23 [00:01<00:03,  4.11it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359132166.png:  39%|███▉      | 9/23 [00:02<00:03,  4.24it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2360377366.png:  43%|████▎     | 10/23 [00:02<00:03,  4.29it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358837309.png:  52%|█████▏    | 12/23 [00:02<00:02,  4.57it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359984157.png:  57%|█████▋    | 13/23 [00:03<00:02,  4.64it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358902813.png:  61%|██████    | 14/23 [00:03<00:01,  4.63it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2360213528.png:  70%|██████▉   | 16/23 [00:03<00:01,  4.77it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2360311826.png:  74%|███████▍  | 17/23 [00:03<00:01,  4.28it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359164936.png:  78%|███████▊  | 18/23 [00:04<00:01,  4.30it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2360279093.png:  83%|████████▎ | 19/23 [00:04<00:00,  4.29it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358968374.png:  87%|████████▋ | 20/23 [00:04<00:00,  4.10it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2359132179.png:  91%|█████████▏| 21/23 [00:04<00:00,  4.23it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358837288.png:  96%|█████████▌| 22/23 [00:05<00:00,  4.22it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2358837288.png: 100%|██████████| 23/23 [00:05<00:00,  4.30it/s]
2076835844:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076573720:  50%|█████     | 1/2 [00:00<00:00,  4.29it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076573720: 100%|██████████| 2/2 [00:00<00:00,  4.45it/s]
2077065267:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2077065261:  20%|██        | 1/5 [00:00<00:00,  4.34it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2077196339:  60%|██████    | 3/5 [00:00<00:00,  4.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2077163537: 100%|██████████| 5/5 [00:01<00:00,  4.31it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


0it [00:00, ?it/s]
2178875407:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178875407: 100%|██████████| 1/1 [00:00<00:00,  3.75it/s]
2081816595:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2081816595: 100%|██████████| 1/1 [00:00<00:00,  4.01it/s]
2141126690:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2141126690: 100%|██████████| 1/1 [00:00<00:00,  3.97it/s]
2178809909:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178744437:  50%|█████     | 1/2 [00:00<00:00,  3.80it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2178744437: 100%|██████████| 2/2 [00:00<00:00,  4.04it/s]
2178777105:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178908194:  50%|█████     | 1/2 [00:00<00:00,  3.36it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2178908194: 100%|██████████| 2/2 [00:00<00:00,  3.85it/s]
2067103760:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1448476743:  67%|██████▋   | 2/3 [00:00<00:00,  4.46it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1448443953: 100%|██████████| 3/3 [00:00<00:00,  4.64it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1448443953: 100%|██████████| 3/3 [00:00<00:00,  4.53it/s]
2051112983:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2051112983: 100%|██████████| 1/1 [00:00<00:00,  4.06it/s]
2141126673:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2141126667:  33%|███▎      | 1/3 [00:00<00:00,  3.72it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2141126670:  67%|██████▋   | 2/3 [00:00<00:00,  3.57it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2141126670: 100%|██████████| 3/3 [00:00<00:00,  3.89it/s]
2463105049:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2463105049: 100%|██████████| 1/1 [00:00<00:00,  3.44it/s]
2178908167:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178908167: 100%|██████████| 1/1 [00:00<00:00,  4.23it/s]
2017558529:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2017460227:  33%|███▎      | 1/3 [00:00<00:00,  3.94it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2017394695:  67%|██████▋   | 2/3 [00:00<00:00,  4.41it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2017394695: 100%|██████████| 3/3 [00:00<00:00,  4.23it/s]
2178744413:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178744413: 100%|██████████| 1/1 [00:00<00:00,  3.85it/s]
2264825859.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2264825859.png: 100%|██████████| 1/1 [00:00<00:00,  4.24it/s]
1740439630.jpg:   0%|          | 0/5 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1740439624.jpg:  20%|██        | 1/5 [00:00<00:00,  4.08it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1740439636.jpg:  40%|████      | 2/5 [00:00<00:00,  3.91it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1740439611.jpg:  60%|██████    | 3/5 [00:00<00:00,  4.17it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1740439618.jpg:  80%|████████  | 4/5 [00:01<00:00,  3.88it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


1740439618.jpg: 100%|██████████| 5/5 [00:01<00:00,  3.88it/s]
2157346817.png:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2157445121.png:  33%|███▎      | 1/3 [00:00<00:00,  4.32it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2157412381.png:  67%|██████▋   | 2/3 [00:00<00:00,  4.56it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2157412381.png: 100%|██████████| 3/3 [00:00<00:00,  4.61it/s]
2432663555.jpg:   0%|          | 0/29 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2431942664.jpg:   3%|▎         | 1/29 [00:00<00:10,  2.55it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432040967.jpg:   7%|▋         | 2/29 [00:00<00:07,  3.39it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402517000.jpg:  10%|█         | 3/29 [00:00<00:06,  3.88it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2435809319.jpg:  14%|█▍        | 4/29 [00:01<00:06,  3.60it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402516994.jpg:  17%|█▋        | 5/29 [00:01<00:06,  3.90it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2401730623.jpg:  21%|██        | 6/29 [00:01<00:05,  4.15it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402680839.png:  24%|██▍       | 7/29 [00:01<00:05,  4.22it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2431877122.jpg:  28%|██▊       | 8/29 [00:02<00:05,  3.60it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432794626.jpg:  31%|███       | 9/29 [00:02<00:05,  3.88it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2423914511.jpg:  34%|███▍      | 10/29 [00:02<00:04,  4.12it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2401992718.jpg:  38%|███▊      | 11/29 [00:02<00:04,  4.32it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402517011.jpg:  41%|████▏     | 12/29 [00:03<00:03,  4.31it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2401959952.jpg:  45%|████▍     | 13/29 [00:03<00:03,  4.10it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402385923.jpg:  48%|████▊     | 14/29 [00:03<00:03,  4.02it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2423914505.jpg:  52%|█████▏    | 15/29 [00:03<00:03,  4.09it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402320388.jpg:  55%|█████▌    | 16/29 [00:04<00:03,  4.12it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432565251.jpg:  59%|█████▊    | 17/29 [00:04<00:02,  4.20it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2431909895.jpg:  62%|██████▏   | 18/29 [00:04<00:02,  4.15it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402418690.png:  66%|██████▌   | 19/29 [00:04<00:02,  4.05it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2432925697.jpg:  69%|██████▉   | 20/29 [00:05<00:02,  3.56it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402058244.jpg:  72%|███████▏  | 21/29 [00:05<00:02,  3.20it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2402484226.jpg:  76%|███████▌  | 22/29 [00:05<00:02,  3.02it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2436104206.jpg:  79%|███████▉  | 23/29 [00:06<00:01,  3.07it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2401959941.jpg:  83%|████████▎ | 24/29 [00:06<00:01,  3.05it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432106507.png:  86%|████████▌ | 25/29 [00:06<00:01,  3.41it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2402680833.jpg:  90%|████████▉ | 26/29 [00:07<00:00,  3.50it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432237582.jpg:  93%|█████████▎| 27/29 [00:07<00:00,  3.73it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432466955.jpg:  97%|█████████▋| 28/29 [00:07<00:00,  3.90it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2432466955.jpg: 100%|██████████| 29/29 [00:07<00:00,  3.76it/s]
2170060829.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2170060829.png: 100%|██████████| 1/1 [00:00<00:00,  4.17it/s]
2170552339.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2170552339.png: 100%|██████████| 1/1 [00:00<00:00,  3.23it/s]
2178908194.txt: 100%|██████████| 2/2 [00:00<00:00,  9.03it/s]
2167963683.png:  33%|███▎      | 1/3 [00:00<00:00,  7.95it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2167963677.png: 100%|██████████| 3/3 [00:00<00:00, 10.57it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2141126707.png:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2141126707.png: 100%|██████████| 2/2 [00:00<00:00, 13.21it/s]
2279702617.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279800903.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279833662.png:  33%|███▎      | 2/6 [00:00<00:00,  9.73it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279571537.png:  67%|██████▋   | 4/6 [00:00<00:00, 11.45it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279440461.png: 100%|██████████| 6/6 [00:00<00:00, 11.70it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2408644630.png:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2408480795.png:  33%|███▎      | 1/3 [00:00<00:00,  9.66it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2408841232.png: 100%|██████████| 3/3 [00:00<00:00, 11.11it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2274983939.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2274983939.png: 100%|██████████| 1/1 [00:00<00:00, 14.13it/s]
1448476743.xls:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xd0 in position 0: invalid continuation byte


1448443953.doc:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xd0 in position 0: invalid continuation byte


2067103760.xlsx:  67%|██████▋   | 2/3 [00:00<00:00, 12.68it/s]

'utf-8' codec can't decode byte 0x8d in position 10: invalid start byte


2067103760.xlsx: 100%|██████████| 3/3 [00:00<00:00, 10.91it/s]
2341339160.png: 100%|██████████| 1/1 [00:00<00:00, 15.12it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2051112983.pdf:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xe2 in position 10: invalid continuation byte


2051112983.pdf: 100%|██████████| 1/1 [00:00<00:00, 11.63it/s]
2320990224.png:   0%|          | 0/27 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273902639.png:   0%|          | 0/27 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320596995.png:   7%|▋         | 2/27 [00:00<00:02, 11.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320629766.png:   7%|▋         | 2/27 [00:00<00:02, 11.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320859144.png:  15%|█▍        | 4/27 [00:00<00:01, 12.10it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273706009.png:  15%|█▍        | 4/27 [00:00<00:01, 12.10it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273706016.png:  22%|██▏       | 6/27 [00:00<00:01, 11.55it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320990210.png:  22%|██▏       | 6/27 [00:00<00:01, 11.55it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273837111.png:  30%|██▉       | 8/27 [00:00<00:01, 10.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279669845.png:  30%|██▉       | 8/27 [00:00<00:01, 10.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2279669868.png:  37%|███▋      | 10/27 [00:00<00:01, 10.03it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320924675.png:  44%|████▍     | 12/27 [00:01<00:01, 10.70it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320859137.png:  44%|████▍     | 12/27 [00:01<00:01, 10.70it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273640525.png:  52%|█████▏    | 14/27 [00:01<00:01, 11.26it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320957441.png:  59%|█████▉    | 16/27 [00:01<00:00, 11.69it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320564240.png:  67%|██████▋   | 18/27 [00:01<00:00, 12.13it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2320564228.png:  67%|██████▋   | 18/27 [00:01<00:00, 12.13it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2280259585.png:  74%|███████▍  | 20/27 [00:01<00:00, 12.16it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273673258.png:  81%|████████▏ | 22/27 [00:01<00:00, 12.85it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2273640539.jpg:  89%|████████▉ | 24/27 [00:02<00:00, 12.41it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2273837118.jpg:  89%|████████▉ | 24/27 [00:02<00:00, 12.41it/s]

'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2320990217.png: 100%|██████████| 27/27 [00:02<00:00, 11.92it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226389215.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226520185.png:   0%|          | 0/6 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226520157.png:  33%|███▎      | 2/6 [00:00<00:00, 12.61it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226290791.png:  33%|███▎      | 2/6 [00:00<00:00, 12.61it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226356369.png:  67%|██████▋   | 4/6 [00:00<00:00, 12.55it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226258045.png:  67%|██████▋   | 4/6 [00:00<00:00, 12.55it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226258045.png: 100%|██████████| 6/6 [00:00<00:00, 12.86it/s]
2092793957.png:   0%|          | 0/10 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2227929113.png:   0%|          | 0/10 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2228125713.png:  20%|██        | 2/10 [00:00<00:00, 12.50it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2228191241.png:  20%|██        | 2/10 [00:00<00:00, 12.50it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093088790.png:  40%|████      | 4/10 [00:00<00:00, 12.20it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093088784.png:  40%|████      | 4/10 [00:00<00:00, 12.20it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2185396233.png:  60%|██████    | 6/10 [00:00<00:00, 12.04it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2228027423.png:  60%|██████    | 6/10 [00:00<00:00, 12.04it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2092957708.png:  80%|████████  | 8/10 [00:00<00:00, 11.13it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2092499075.png:  80%|████████  | 8/10 [00:00<00:00, 11.13it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2092499075.png: 100%|██████████| 10/10 [00:00<00:00, 10.83it/s]
2344189991.png: 100%|██████████| 1/1 [00:00<00:00, 11.19it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2096234497.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2096234497.png: 100%|██████████| 1/1 [00:00<00:00,  9.31it/s]
2226651139.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2226651139.png: 100%|██████████| 1/1 [00:00<00:00, 10.50it/s]
2141159437.png:   0%|          | 0/2 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2141159437.png: 100%|██████████| 2/2 [00:00<00:00, 11.77it/s]
2175565853.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2175565853.png: 100%|██████████| 1/1 [00:00<00:00,  9.77it/s]
2186051600.png:   0%|          | 0/4 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2186313729.png:  25%|██▌       | 1/4 [00:00<00:00,  9.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2186182664.png:  75%|███████▌  | 3/4 [00:00<00:00, 12.10it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2186182664.png: 100%|██████████| 4/4 [00:00<00:00, 11.59it/s]
2441642079.png:   0%|          | 0/12 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642061.png:  17%|█▋        | 2/12 [00:00<00:00, 11.94it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642042:  33%|███▎      | 4/12 [00:00<00:00, 12.93it/s]    

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0xff in position 0: invalid start byte


2441642109.png:  33%|███▎      | 4/12 [00:00<00:00, 12.93it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642049.png:  50%|█████     | 6/12 [00:00<00:00, 12.19it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642091.png:  67%|██████▋   | 8/12 [00:00<00:00, 12.31it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642055.png:  83%|████████▎ | 10/12 [00:00<00:00, 12.69it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642085.png:  83%|████████▎ | 10/12 [00:00<00:00, 12.69it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2441642085.png: 100%|██████████| 12/12 [00:00<00:00, 12.73it/s]
2141126673.pdf:   0%|          | 0/3 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0xe2 in position 11: invalid continuation byte
'utf-8' codec can't decode byte 0xe2 in position 11: invalid continuation byte


2141126667.pdf:  67%|██████▋   | 2/3 [00:00<00:00, 12.36it/s]

'utf-8' codec can't decode byte 0xe2 in position 11: invalid continuation byte


2141126667.pdf: 100%|██████████| 3/3 [00:00<00:00, 12.55it/s]
2093416464.png:   0%|          | 0/16 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093154344.png:  12%|█▎        | 2/16 [00:00<00:01, 11.93it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093318164.png:  25%|██▌       | 4/16 [00:00<00:00, 12.77it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093252627.png:  25%|██▌       | 4/16 [00:00<00:00, 12.77it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093383681.png:  38%|███▊      | 6/16 [00:00<00:01,  9.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093416449.png:  38%|███▊      | 6/16 [00:00<00:01,  9.09it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093318180.png:  50%|█████     | 8/16 [00:00<00:00,  8.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093121563.png:  56%|█████▋    | 9/16 [00:01<00:00,  8.90it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093121583.png:  69%|██████▉   | 11/16 [00:01<00:00,  9.45it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2092990493.png:  81%|████████▏ | 13/16 [00:01<00:00,  9.25it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2093318191.png: 100%|██████████| 16/16 [00:01<00:00,  9.90it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2463105049: 100%|██████████| 1/1 [00:04<00:00,  4.75s/it]
2178908167.sh: 100%|██████████| 1/1 [00:00<00:00,  6.74it/s]
2076246031:  17%|█▋        | 1/6 [00:00<00:00,  6.53it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076246063:  50%|█████     | 3/6 [00:00<00:00,  7.58it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076246048:  83%|████████▎ | 5/6 [00:00<00:00,  7.59it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2076246048: 100%|██████████| 6/6 [00:00<00:00,  7.47it/s]
2065694727.js: 100%|██████████| 2/2 [00:00<00:00,  5.85it/s]  
2427224116.png:  50%|█████     | 1/2 [00:00<00:00,  6.81it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2427224116.png: 100%|██████████| 2/2 [00:00<00:00,  8.16it/s]
2041905246.png:  12%|█▎        | 1/8 [00:00<00:01,  6.97it/s]

'utf-8' codec can't decode byte 0xb5 in position 11: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2017558529.pdf:  38%|███▊      | 3/8 [00:00<00:00,  6.78it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0xb5 in position 11: invalid start byte


2041741480.png:  75%|███████▌  | 6/8 [00:00<00:00,  8.68it/s]

'utf-8' codec can't decode byte 0xc7 in position 10: invalid continuation byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte
'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2042429532.png: 100%|██████████| 8/8 [00:00<00:00,  8.39it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2178744413.sh: 100%|██████████| 1/1 [00:00<00:00,  8.92it/s]
2151415815.png: 100%|██████████| 1/1 [00:00<00:00,  9.72it/s]


'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2134179870.png:   0%|          | 0/1 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2134179870.png: 100%|██████████| 1/1 [00:00<00:00,  8.72it/s]
2176352260.png:   0%|          | 0/8 [00:00<?, ?it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176024617.png:  12%|█▎        | 1/8 [00:00<00:00,  8.42it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176352266.png:  25%|██▌       | 2/8 [00:00<00:00,  8.04it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2175926280.png:  38%|███▊      | 3/8 [00:00<00:00,  8.07it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176090140.png:  50%|█████     | 4/8 [00:00<00:00,  8.44it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176483329.png:  62%|██████▎   | 5/8 [00:00<00:00,  8.90it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176450572.png:  75%|███████▌  | 6/8 [00:00<00:00,  8.80it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176122890.png:  88%|████████▊ | 7/8 [00:00<00:00,  8.62it/s]

'utf-8' codec can't decode byte 0x89 in position 0: invalid start byte


2176122890.png: 100%|██████████| 8/8 [00:00<00:00,  8.24it/s]
