In [1]:
import os
import pandas as pd
import cv2
import pytesseract
from PIL import Image
from tqdm import tqdm

def extract_text_pytesseract(img_path):
    img = cv2.imread(img_path)
    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
    gray = cv2.adaptiveThreshold(
        gray, 255,
        cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
        cv2.THRESH_BINARY, 11, 2
    )
    text = pytesseract.image_to_string(
        gray,
        lang="eng",
        config="--psm 6"
    )
    return text.strip()

# Ventile 1 e 20
df = pd.read_csv("./complete_viral_dataset.csv")
df = df[df["Ventile"].isin([1, 20])].reset_index(drop=True)
df["ocr_text"] = ""

# Processando o OCR
root_dir = "reddit-virality-dataset"
for idx, row in tqdm(df.iterrows(), total=len(df)):
    ventile  = row["Ventile"]
    filename = row["Filename"]
    img_path = os.path.join(root_dir, f"Ventile_{ventile}", filename)
    if os.path.isfile(img_path):
        try:
            df.at[idx, "ocr_text"] = extract_text_pytesseract(img_path)
        except Exception as e:
            print(f"Erro ao processar {img_path}")
            print("Erro:", {e})
            df.at[idx, "ocr_text"] = ""
    else:
        df.at[idx, "ocr_text"] = ""
        
df.to_csv("complete_viral_dataset_ventiles1_20_with_ocr.csv", index=False)
print("Novo CSV gerado: complete_viral_dataset_ventiles1_20_with_ocr.csv")

  0%|          | 3/1700 [00:00<02:15, 12.57it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/ea9p6np4ldcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/x7o2a4vzp8cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/yz5avbuaohcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/f738top4qgcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/psp1ftqt35cc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  0%|          | 6/1700 [00:00<01:30, 18.81it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/w6m2p5d4bdcc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/omzjuz5m61cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/u4j3mqqv81cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  1%|          | 13/1700 [00:00<01:29, 18.91it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/yciitt13lvbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/4zkf2l2eq3cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/jqhu8o6wkmbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ddqduu5pakbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/gt48dr3t0jbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar 

  1%|          | 17/1700 [00:00<01:27, 19.26it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/yv3qzbip0fbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/8ptnqon7vzac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/pm6za6rspxac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  1%|          | 20/1700 [00:01<01:23, 20.23it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/lcoo7izemqac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ipvondezanac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  1%|▏         | 23/1700 [00:01<02:14, 12.43it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/cq4urbl04zac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/oeap8zcvgkac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/8ey548loqdac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/h32mmpjwddac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/owxbfcbeqmac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  2%|▏         | 26/1700 [00:01<01:59, 13.99it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/a942wiupylac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/y5xi9p9oa7ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  2%|▏         | 34/1700 [00:02<02:13, 12.51it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/bsrwmu1rq3ac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ybpu0ylmyq9c1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/lutgugajop9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/g8wgibvk9o9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/6i43jqbfak9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar

  2%|▏         | 40/1700 [00:02<01:32, 17.98it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/1dklxoo45v8c1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/g002hguckn8c1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/zxdsi4t0oj8c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/j182132bqg8c1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/joy7dx1odbcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar 

  3%|▎         | 46/1700 [00:02<01:21, 20.37it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/s2hvuxb648cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/cn8h7pq3f8cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/azweps80mhcc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/6no0kyb1fhcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/2x1hd3u61ecc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  3%|▎         | 49/1700 [00:03<01:37, 16.90it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/o9w2nrn7e2cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/1xpp9m6wmdcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/yfi0651qaccc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/vtyjtygj8gcc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/1hmevbbenybc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  3%|▎         | 54/1700 [00:03<01:22, 19.92it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/jg00bt7z2ybc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/y4h8n97hmccc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/ass0huz308cc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ut5p5074bwbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  4%|▎         | 60/1700 [00:03<01:16, 21.54it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/n2na38hnpccc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/26kga7fxytbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/es50s2brztbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/9yhyzia5csbc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/zsc1bav7wrbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar r

  4%|▍         | 66/1700 [00:03<01:13, 22.24it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/vo3jj528oqbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/sdv9f5rjoacc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/91gig6i2o7cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/7t78yos82acc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/4q38krnpeobc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  4%|▍         | 69/1700 [00:04<01:23, 19.42it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/tvuoh49grnbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/3liy79uuv1cc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/dzaoaud6jzbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/udkkhokhclbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/4ec24x05dibc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  4%|▍         | 75/1700 [00:04<01:31, 17.68it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/on8mc9usihbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/89l55sa3thbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/wyjtrdq5ksbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ravispbr3gbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  5%|▍         | 80/1700 [00:04<01:22, 19.69it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/un29h7dlqebc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/jmpth0fxaebc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/jetvslm4gbbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/pivwdyvarabc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/nmyscojf3abc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processa

  5%|▌         | 87/1700 [00:05<01:31, 17.60it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/ibg60plpnpbc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/btj7zhsizobc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/ach2yu7ds7bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/gftdy5mml6bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/ol4d5o1gxobc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar 

  6%|▌         | 94/1700 [00:05<01:15, 21.25it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/3eud94v3u0bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/8xbzc621f0bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/sv5gl2ar2ibc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/qhey8q458wac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/1rog5fxfkabc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  6%|▌         | 97/1700 [00:05<01:22, 19.45it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/x9z975rkr9bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/78qi4zaxt7bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/sud1wfkkwoac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/0nzx5qy1cpac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/k4jdu3mo3pac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  6%|▌         | 103/1700 [00:05<01:21, 19.63it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/g45nq5rfk7bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/n4yklxmoynac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/1s11p1ulgmac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/nr2uzgzsn3bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  6%|▌         | 106/1700 [00:06<01:17, 20.59it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/f10jzvltp3bc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/kkzny749o2bc1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/gyrct0sev3bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/hpw0w1bm91bc1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/tzsn2mr18gac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  7%|▋         | 112/1700 [00:06<01:11, 22.10it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/59940ogl1vac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/8z3kxhwncfac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/1nx2mhhtiuac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/lbtkcyn0x8ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/qea9g91388ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  7%|▋         | 115/1700 [00:06<01:22, 19.10it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/f0om4mjjeqac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/6uqsyhv9l4ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/5wngpdepc4ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  7%|▋         | 121/1700 [00:06<01:22, 19.24it/s]

Erro ao processar reddit-virality-dataset/Ventile_1/i3jo1uk90oac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/D6T8n5S.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/1wbxos5sdhac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/aeyxvcjno0ac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/vi332ta7ikac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  7%|▋         | 124/1700 [00:07<01:30, 17.37it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/t83co9u9vz9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/3a0io0xhby9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/qpgsw3t7oiac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/5mwyrjd69iac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/jl1de3tdxhac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}


  8%|▊         | 131/1700 [00:07<01:13, 21.38it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/19oas3aqnx9c1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/8b5wfuh2qw9c1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/ngwjtsmn8cac1.jpeg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_1/4b39w08ce9ac1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/29i5eci7pzua1.jpg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar re

  8%|▊         | 138/1700 [00:07<01:26, 18.15it/s]

Erro ao processar reddit-virality-dataset/Ventile_20/f4tyjk7u7hua1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/htyfqjnnprta1.jpg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/9n9gmh283jta1.jpg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/n8fze7s9w1ta1.png
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar reddit-virality-dataset/Ventile_20/da7xpx1h2zsa1.jpg
Erro: {TesseractNotFoundError("tesseract is not installed or it's not in your PATH. See README file for more information.")}
Erro ao processar re




KeyboardInterrupt: 